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TCTGTGGTTT GTCAGACCTG 
CTGAACCGCA CTGAAGAACT 
GTCTTAGTCC TGCAGAATCA 
AGTTCTCTGT TCCTGAGGAA 
AAAAAAAGCC TGATTAAAGA 
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CAAGCAAGCC 
CTTGTCCTCA 
GGAGTCACCA 
CTAAATTTAA 
GTTTCTGCCT 



CCCTGCTGGG 
CTGGCTGATG 
GATGATGCAG 
GGAAAAAATG 
GTTAAAAAAA 



GAAGCCTAGG 
CAGCAGAACT 
AGTTGAGATC 
GGATTTTGTT 
AAAAAAAAAA 



TGTCCTTGAG 22 80 

CTTGGGAAAT 23 40 

ATCATTGCAA 2400 

TTAGAGTTGG 2460 
AAAAAA 
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MSGRRTRSGG AAQRSGPRAP SPTKPLRRSQ RKSGSELPSI IiPElWPKTPS AAAVRKP 1VL 

KRIVAHAVEV PAVQSPRRSP RISFFLEKEN EPPGRELTKE DLFKTHSVPA TPTSTPVPNP 

EABSSSKEGE LDARDLEMSK KVRRSYSRLE TLGSASTSTP GRRSCFGFEG LLGAEDLSGV 

SPWCSKLTE VPRVCAKPWA PDMTLPGISP PPEKQKRKKK KMPEIIiKTEL DEWAAAMNAE 

FEAAEQFDLL VE 

Seq ID NO: 98 DNA sequence

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 58-12444 
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85 



GGGGCATTTC 
GCGGGCTCCG 
GCGGACCGCT 
TGCGTCCTGA 
GATTTCGGTT 
AGAGAAGAAA 
CCTTACTCTG 
AAATGTAAAA 
AGACT CATGG 
TTGAAAAAAA 
GGTGAAGTTC 
GGTGAACTTA 
GGATGTCTGA 
CCCCAGACTT 
CTGAAGAGAT 
TTTAGCACCT 
GCCCACACAA 
CAGGTTTCTA 
ATGGAGCAGT 
GCTATCCGTG 
GACTTCATGT 
ACTGGTGACG 
CTGTACCTTG 
CAGATAGACA 
GTGAAGGTGT 
GTGGTGCATC 
GAGT CTGAAT 
CCCACATACA 
GATTCTATTT 
CATTTACTTT 
ACACTTGAAA 
ATGATCCCAA 
GCTTTCATTA 
TTTGAACCAT 
CTCATCAGTG 
TATTTCGAGG 
TCTTGCTTTG 
AAAGATGAAC 
GAACTCGATG 
TATACCCCCT 
AGACATGTAA 
ACTTCAGCCT 
GCCCAGAAAG 
T CAAACGAAG 
CTAGGAGGAC 
AGCTATGTGG 
AAACCTGTCA 
AGTGACAGAC 
TTGGGCAAAG 
TATAAG CGG A 
CAACTGTATG 
GAAAGTCAGG 
GACAGTACTT 
AAGCAAATAA 
CGACTTTATA 
TTTAATAATA 
GAAGCCTTGG 
GGTACAATTC 
CATGTTT CTT 
TCATTGTGTT 
GAATGTCGAC 
AGATCCCCTA 
AACACCTTTG 
TTGTACCTTC 



CGGGTCCGGG 
GAGCCGGTGT 
GCGGTGCTGC 
GCAGCAGCCC 
TGCTTGTATT 
TCCTAAAGTT 
TTGAAATTAA 
TTCCAGCCCT 
ATGAATTTAA 
AAATACCAGA 
ATCCTAGTGA 
AGACCCAGAT 
AGGGGTTGTC 
CAAGGGAGAT 
ATGCTGTGCC 
GCCTTCTGGA 
ATGTAGAATT 
ATATGGTGGC 
TTTATGGAAT 
GATATGGACT 
ACGTTGAGCT 
ACCGTGTTTA 
ACACAGTTCC 
GTTTCCCACA 
TCCTAGCTTT 
AGGGTTTAAT 
CTGAAGACCA 
AAGACTACGT 
TAGCAGATGA 
ATGATGAATT 
TACAGACTGT 
CTTCAGATCC 
ACCTGGTGGA 
GGGTGTACTC 
GTTTCTACAA 
GAGTTAGTCC 
CTTTATTTGT 
TTTTGGCCTC 
TTAGAGCCTA 
TGGCAGAAGT 
TGCAGCCTTA 
TGT CAGATG A 
GATTTAATAA 
CAATATCCTT 
AAATAAACAA 
CCTGGGACAG 
TTTTCCTGGA 
AAACTAAAGT 
CCACGCAGAT 
CGTTTCCTGT 
AGCCACTAGT 
ATACTGTTGC 
TAAGAGATTT 
CACCACAGCA 
GCCTTGCGCT 
TCTACAGGGA 
TGATATACAT 
AACAGTGTTG 
TAAATAAAGC 
TATTGGATCT 
ACAAATCCAT 
ATTTGTGGCT 
AGGGGGGTGG 
GGGGGCCATT 



CCGAGCGGGC 
GCGTTGCTCC 
CCTGGCCGGT 
CGCGGTGCTG 
TGT CCGGAAG 
TTTATGTATT 
GAACACTTGT 
GGACCTTCTT 
AATTGGAGAA 
TACAGTTTTA 
GATGATAAAT 
GACATCAGCA 
CTCACTTCTG 
TTTTAATTTT 
CTCAGCTGGC 
CAACTACGTG 
GAAAAAAGCT 
GAAAAATGCA 
CAT CAGAAAT 
TTTTGCAGGA 
CATTCAGCGC 
TCAGATGCCA 
TGAGGTGTAT 
GTACAGTCCA 
GGCAGCAAAA 
CAGAATATGT 
CCGTGCTTCA 
GGATCTCTTC 
AGCATTTTTC 
TGTAAAATCC 
TGGGGAACAA 
AG CGG G T AAC 
ATTTTGCAGA 
ATTTTCATAT 
ATTGCTTTCT 
AAAGAGTCTG 
GAAATTTGGC 
TTGTTTGACC 
CGTTCCTGCA 
AGGCCTGAAT 
TTACAAAGAC 
GACCAAGAAT 
AGTGGTGTTA 
AGAAGAAATA 
AAATCTTCTG 
AGAGAAGCGG 
TGTGTTCCTG 
TGCAGCCTGT 
GCCAGAAGGG 
GCTGCTTCGA 
TATGCAGCTG 
CTTACTAGAA 
TTGTGGTCGG 
GCAGGAGAAG 
TCACCCCAAT 
ATTCAGGGAA 
GGAGAGTCTG 
TGATGCCATT 
AAAGAAACGA 
GGT CAAGTGG 
TGAACTCTTT 
GAAAGATGTT 
CTGTGGCCAG 
CAGCCTGCAG 



31 

I 

GCACGCGCGG 
CTGCTGCGGC 
CATCAACTGA 
GCATTACAGA 
TCACTCAACA 
TTCTTAGAAA 
ACCAGTGTTT 
ATTAAGTTAC 
TTATTTAGTA 
GAAAAAGTAT 
AATGCAGAAA 
GTAAGAGAGC 
TGCAACTTCA 
GTACTAAAGG 
TTGCGCCTAT 
TCTCTATTTG 
GCACTTTCAG 
GAAATGCATA 
GTGGATTCGA 
CCGTGCAAGG 
TGCAAGCAGA 
AGCTTCCTCC 
ACTCCAGTTC 
AAAATGCAGC 
GGGCCAGTTC 
TCTAAACCAG 
GGGGAAGTCA 
AGACATCTCC 
TCTGTGAATT 
GTTTTGAAGA 
GAGAATGGAG 
TTGCATCCAG 
GAGATTCTCC 
GAATTAATTT 
ATTACAGTAA 
AAACACTCTC 
AAAGAGGTGG 
TTTCTTCTGT 
CTGCAGATGG 
GCTCTAGAAG 
ATTCTCCCCT 
AACTGGGAAG 
AAGCATCTGA 
AGAATTAGAG 
ACAGTCACGT 
CTGAGCTTTG 
CCTCGAGTCA 
GAACTTTTAC 
GGACAGGGAG 
CTTGCGTGTG 
ATTCACTGGT 
GCTATATTGG 
TGT ATT CGAG 
AGTCCAGTAA 
GCTTTCAAGA 
GAAGAGTCTC 
GCCTTAGCAC 
GATCACCTAT 
CGTTTGCCGC 
CTTTTAGCTC 
TATAAATTCG 
CT CAAGGAAG 
CCCTCGGGCA 
GCCACGCTAT 



41 
i 

GAGCGGGACT 
TGCAGGAGAC 
TCCGCGGCCT 
CATCTTTAGT 
GTATTGAATT 
AAATGGGCCA 
ATACAAAAGA 
TTCAGACTTT 
AATTCTATGG 
ATGAGCTCCT 
ACCTGTTCCG 
CCAAACTACC 
CTAAGTCCAT 
CAATTCGTCC 
TTGCCCTGCA 
AAGTCTTGTT 
CCCTGGAATC 
AAAATAAACT 
ACAACAAGGA 
TTATAAACGC 
TGTTCCTCAC 
AGTCTGTTGC 
TGGAGCACCT 
TGGTGTGTTG 
TCAGGAATTG 
TGGTCCTTCC 
GAACTGGCAA 
TGAG CTCTGA 
CCTCCAGTGA 
TTGTTGAGAA 
ATGAGGCGCC 
CTAAACCTAA 
CTGAGAAACA 
TGCAATCTAC 
GAAATGCCAA 
CTGAAGACCC 
CAGTTAAAAT 
CCTTGCCACA 
CTTTCAAACT 
AATGGTCAAT 
GCCTGGATGG 
TGTCAGCTCT 
AGAAGACAAA 
TAGTACAAAT 
CCTCAGATGA 
CAGTGCCCTT 
CAGAAT T AGC 
ATAGCATGGT 
CCCCACCCAT 
ATGTTGATCA 
TCACTAACAA 
ATGGAATTGT 
AATTCCTTAA 
ACACCAAATC 
GGCTGGGAGC 
TGGTGGAACA 
ATGCAGATGA 
GCCGCATCAT 
GAGGATTTCC 
AT TGTGGGAG 
TTCCTTTATT 
AAGGTGTCTC 
TCCTGGCCCA 
GCTGGCTGGA 



51 
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CGGCGGCATG 

CTTGTCCGCT 

GGGG CAGGAA 

TTTTTCCAGA 

TCGTGAATGT 

GAAGATCGCA 

TAGAGCTGCT 

TAGAAGTTCT 

AGAACTTGCA 

AGGATTATTG 

CGCTTTTCTG 

TGTTCTGGCA 

GGAAGAAGAT 

TCAGATTGAT 

TGCATCT CAG 

AAAGTGGTGT 

CTTTCTGAAA 

GCAGTACTTT 

GTTATCTATT 

AAAAGATGTT 

CCAGACAGAC 

AAGCGTCTTG 

CGTGGTGATG 

CAGAGCCATA 

CATTAGTACT 

AAAGGGCCCT 

ATGGAAGGTG 

CCAGATGATG 

AAGT CTGAAT 

ATTGGATCTT 

TGGTGTTTGG 

AGATTTTTCG 

AG CAGAATTT 

AAGGTTGCCC 

GAAAATAAAA 

AGAAAAGTAT 

GAAGCAGTAC 

CAACATCATT 

GGGCCTGAGC 

TTATATTGAC 

ATACCTGAAG 

TTCTCGGGCT 

GAACCTTTCA 

GCTTGGATCT 

GATGATGAAG 

TAGAGAGATG 

GCTCACAGCC 

TATGTTTATG 

GTACCAGCTC 

GGTGACAAGG 

CAAGAAATTT 

GGACCCTGTT 

ATGGTCCATT 

GCTTTTCAAG 

ATCACTTGCC 

GTTTGTGTTT 

GAAGTCCTTA 

TGAAAAGAAG 

ACCTTCCGCA 

GCCCCAGACA 

GCCAGGCAAC 

TTTTCTCATC 

GCCCACCCTC 

CCTGCTCCTG 
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420 
480 
540 
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720 
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3540 
3600 
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3720 
3780 
3840 
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GCCGCGTTGG AGTGCTACAA CACGTTCATT 
CTAGGTACTG AAGCCCAGTC TTCACTTTTG 
GCCATGCATG AC AT TAT AG C AGCAGAAAAG 
ACAAGCCCAC AAGAGGGAGA AAGGTACAAC 
5 ATGGAGTTTA CCACGACTCT GCTAAACACC 

GACTTGTGTA ATACACACCT GATGAGAGTC 
ATAGGTTTCA ACATCGGAGA CGTCCAGGTT 
CTGATGAAAG CTCTAAAGAT GTCCCCATAC 
AAAATAACAG CACAGAGCAT TGAGGAGCTT 

10 CAAGTGGACA GGAGCAGGCT GGCTGCTGTT 

GGGCTTCTGC ATAATATATT ACCGTCTCAG 
GAACTTCTTT CCCTGGTTTA TAAAGGCATT 
TCTCTAGACC TCAGTTGTAA GCAGCTGGCC 
GGAGGACTGT GTGAGCGCCT TGTGAGTCTT 

15 TCCTTGGGCA GCTCACAGGG CAGCGTCATC 

TTGTTCTCAG AAACG AT CAA CACGGAATTA 
CTCATGCAGT CTTCAGTGGA TAATACCAAA 
GACCAGAGCT TCAGGGAGCG AGCAAACCAG 
ATTCTGCAAC ACTGGAAGAA GTGTGATTCA 

20 AAAATGGCAG TGCTGGCCTT ACTGGCAAAA 

AATACAAGTC ATGGTTCATT CCCTGAAGTC 
ACAAAGCTGG ATCTACATTT AAAGGGCCAA 
CTCACTGGAG GCAGTCTGGA GGAACTTAGA 
TTCCCCATGC AGTCCAGGGA ATTTCCTCCA 

25 TGCATGAAAA AGTTTCTAGA TGCATTGGAA 

ATGACAGAAG TTCTTTGTCG GG AACAGCAG 
TTCAGGAGGA TTGCCAGAAG GGGTTCATGT 
TATGAAATGT T C AGGAAGG A TGACCCCCGC 
CGCTCCCTCC TCACTCTGCT GTGGCACTGT 

30 ACAATTGTGG TGGATGCCAT TGATGTGTTG 

ACCTTTGATA CTCAAATCAC CAAGAAGATG 
TCTCGCCTTC CCAAAGATGA TGTTCATGCT 
GGCT CGTGT A TTACAGAAGG AAATGAACTT 
GCATTTACAG AGAACATGGC AGGAGAGAAT 

35 TGTGCAGCAT ACAACTGCGC CAT ATCTGT C 

TACCAAGGTT TTCTGTTTAG TGAAAAACCA 
ATCGACCTGA AGCGCCGCTA TAATTTTCCT 
AAAAAGTACA TTGAAATTAG GAAAGAAGCC 
CCTTCCTATA TGTCTTCCCT GTCATATTTG 

40 CAATTTGATT TCTCAACCGG AGTT CAGAGC 

GCCACTGGTC GTTTTCGGAG ACGGGAGCAG 
GAGCTGGAGA TGGACGAGCT CAATCGGCAT 
AAGCACATGC ACAGAAGCCT GGGCCCGCCT 
CTTCCTTCTT GGATGAAATT CCTCCATGGC 

45 ATCCGTCTCT TCTTAGCCAA GCTTGTTATT 

AAGCACTGGC TTAGCCCCTT GCTGCAGCTG 
ATTCACTACA TGGTGGTTGA GATAGTGGCC 
CCAACAGGGG TCCCTAAAGA TGAAGTGTTA 
CATGTCTTTC ATCCAAAAAG AGCTGTGTTT 

50 GTCGAGTGCT GGAAGGATTG TTTATCCATC 

GGTAAAGATC CTAATTCTAA AGACAACTCA 
GCCAATGACC TGCCTCCCTA TGACCCACAG 
GCTTTGGTGA ATAATATGT C CTTTGTAAGA 
GTT CTAGGAC TTATACTTCG ATATGTTATG 

55 TGTGAACTGG TTGCGAAACA ATTGAAGCAA 

GTGTGCTTGA ACAAAGTGAC CAAGAGCTTC 
GTGTTCTTTC TGCTGCCAAA ATTTCATGGA 
CTTTGTCGTG TGGAGGGAAT GACAGAGCTG 
CAAGTCATGA GACATAGAGA TGATGAAAGA 

60 ATGATGCCAA AGTTAAAACC AGTAGAACTC 

GTTTCCCATC CTTCTACAAC ATGTAGGGAA 
GATAATTACA GAGATCCAGA AAGTGAGACA 
GCAAAAGATG TGCTGATTCA AGGATTGATC 
CGAAATTTCT GGAGCCATGA AACTAGGTTA 

65 CTAAATTCCT TATATTCTCC TAAGATAGAA 

CTGCTCGAAA TG ACCAG CAT GAGCCCAGAT 
TCAGAATGCG AATTT CAGGA ATATACCATT 
CTCACTCCGA TGTTTGTGGA GACCCAGGCC 
GAAGGGTCCC TCTCAGCTCG CTGGCCAGTG 

70 CATGACTTCA CACTGACACA GACTGCAGAT 

AGCAGCACTG ACCCGCTGGT CGACCACACC 
CACAAGAGGA GTGAAAGGTT ACAGAGAGCA 
AAAAAAAGGC TGGGCCTTCC AGGGGACGAG 
CGGACGGACC TACTACGACT GCGCAGACGG 

75 ATGTATGCCA GAAAAGGCGT TGCTGAGCAA 

AAAATGAAGC AGGATGCCCA GGTCGTTCTG 
GACATTCAGA TCAAGCACAG CAGCCTCATC 
CCAATAATTG CAAAACAGCT CTTTAGCAGC 
AAATTTAAGA CACTGTCTGA AAAAAACAAC 

80 CGTTTTCTTA ATACCACCTT CTCTTTCTTT 

AGCTGTCAGC ACGCAGCCCT GCTGAGCCTC 
GCCAGCCTAC AGCAGCCCGT GGGCATCCGC 
CCTGCTGAGC TGCCTGCCAA GCGAGT CCGT 
AGATGGGTGG AGCTTGCTAA GCTGTATAGA 

85 ATTTTTACCA GTGAGATAGG AACAAAGCAA 

AG AAGTG AT T AT T C TGAAGC TGCTAAGCAG 
GTAGATGGTG AGCCCACAGA AGCCGAGAAG 



GGCGAGAGAA CTGTAGGAGC GCTCCAGGTC 3 900 

AAAGCAGTGG CTTTCTTCTT AGAAAGCATT 3 960 

TGCTTTGGCA CTGGGGCAGC AGGTAACAGA 4020 

TACAGCAAAT GCACCGTTGT GGTCCGGATT 4080 

TCCCCGGAAG GATGGAAGCT CCTGAAGAAG 4140 

CTGGTGCAGA CGCTGTGTGA GCCCGCAAGC 42 00 

ATGGCTCATC TTCCTGATGT TTGTGTGAAT 4260 

AAAGATATCC TAGAGACCCA TCTGAGAGAG 4320 

TGTGCCGTCA ACTTGTATGG CCCTGACGCG 43 80 

GTGTCTGCCT GTAAACAGCT TCACAGAGCT 4440 

TCCACAGATT TGCATCATTC TGTTGGCACA 4500 

GCCCCTGGAG ATGAGAGACA GTGTCTGCCT 4560 

AGCGGACTTC TGGAGTTAGC CTTTGCTTTT 4620 

CTCCTGAACC CAGCGGTGCT GTCCACGGCG 4680 

CACTTCTCCC ATGGGGAGTA TTTCTATAGC 4740 

TTGAAAAATC TGGATCTTGC TGTATTGGAG 480 0 

ATGGTGAGTG CCGTTTTGAA CGGCATGTTA 4860 

AAACACCAAG GACTGAAACT TGCGACTACA 4920 

TGGTGGGCCA AAGATTCCCC TCTCGAAACT 4980 

ATTTTACAGA TTGATTCATC TGTATCTTTT 5040 

TTTACAACAT ATATTAGTCT ACTTGCTGAC 510 0 

GCTGTCACTC TTCTTCCATT CTTCACCAGC 5160 

CGTGTTCTGG AGCAGCTCAT CGTTGCTCAC 5220 

GGAACTCCGC GGTT CAATAA TTATGTGGAC 52 80 

TTATCTCAAA GCCCTATGTT GTTGGAATTG 5340 

CATGTCATGG AAGAATTATT TCAATCCAGT 540 0 

GT CACACAAG TAGGCCTTCT GGAAAGCGTG 54 60 

CTAAGTTTCA CACGCCAGTC CTTTGTGGAC 552 0 

AGCCTGGATG CTTTGAGAGA ATTCTTCAGC 5580 

AAGTCCAGGT TTACAAAGCT AAATGAATCT 5640 

GGCTACTATA AGATTCTAGA CGTGATGTAT 5700 

AAGGAATCAA AAATTAAT CA AGTTTTCCAT 5760 

ACAAAGACAT TGATTAAATT GTGCTACGAT 5820 

CAGCTGCTGG AGAGGAGAAG ACTTTACCAT 5880 

ATCTGCTGTG TCTTCAATGA GTTAAAATTT 5940 

GAAAAGAACT TGCTTATTTT TGAAAATCTG 6000 

GTAGAAGTTG AGGTTCCTAT GGAAAGAAAG 6060 

AGAGAAGCAG CAAATGGGGA TTCAGATGGT 6120 

GCAGACAGTA CCCTGAGTGA GGAAATGAGT 6180 

TATTCATACA GCTCCCAAGA CCCTAGACCT 6240 

CGGGACCCCA CGGTGCATGA TGATGTGCTG 6300 

GAGTGCATGG CGCCCCTGAC GGCCCTGGTC 6360 

CAAGGAGAAG AGGATTCAGT GCCAAGAGAT 6420 

AAACTGGGAA ATCCAATAGT ACCATTAAAT 6480 

AATACAGAAG AGGTCTTTCG CCCTTACGCG 6540 

GCTGCTTCTG AAAACAATGG AGGAGAAGGA 660 0 

ACTATTCTTT CATGGACAGG CTTGGCCACT 6660 

GCAAAT CGAT TGCTTAATTT CCTAATGAAA 6720 

AGACACAACC TTGAAATTAT AAAGACCCTT 6780 

CCTTATAGGT TAATATTTGA AAAGTTTTCC 6840 

GTAGGGATTC AATTGCTAGG CATCGTGATG 6900 

TGTGGCATCC AGAGTAGCGA ATACTTCCAG 6 960 

TATAAAGAAG TGTATGCCGC TGCAGCAGAA 7020 

GAGAGAAAAA ACATACTGGA GGAGTCTCTG 7080 

CATCAGAATA CTATGGAGGA CAAGTTTATT 7140 

CCTCCTCTTG CAGACAGGTT CATGAATGCT 7200 

GTGTTGAAAA CACTCTGTCT GGAGGTGGTA 72 60 

TACTTCCAGT TAAAGAGCAA GGACTTCGTT 7320 

CAAAAAGTAT GTTTGGACAT AATTTATAAG 7380 

CGAGAACTTC TGAACCCCGT TGTGGAATTC 7440 

CAAATGTATA ATATTCTCAT GTGGATTCAT 7500 

GATAATGACT CCCAGGAAAT ATTTAAGTTG 7560 

GATGAGAACC CTGGACTTCA ATTAATTATT 7620 

CCTTCAAATA CCTTGGACCG GTTGCTGGCA 7680 

GTGCACTTTT TAAGTTTAGC AACAAATTTT 7740 

TATCCAAACC CCATGTTCGA GCATCCTCTG 7800 

GATTCTGATT GGCGTTTCCG AAGTACTGTT 7860 

TCCCAGGGCA CTCTCCAGAC CCGTACCCAG 7920 

GCAGGGCAGA TAAGGGCCAC CCAGCAGCAG 7980 

GGAAGAAGCT CATTTGATTG GCTGACCGGG 8040 

AGTCCCTCAT CTGACTCCTT GCTGTTTGCC 8100 

CCCTTGAAGT CAGTGGGGCC TGATTTTGGG 8160 

GTGGATAACA AAGTGAAAGG TGCGGCCGGC 8220 

TTTATGAGGG ACCAGGAGAA GCTCAGTTTG 8280 

AAACGAGAGA AGGAAATCAA GAGTGAGTTA 8340 

TACAGAAGCT ACCGGCACGG AGACCTTCCT 8400 

ACCCCGTTAC AGGCCGTGGC CCAGAGGGAC 8460 

TTGTTTTCTG GAATTTTGAA AGAGATGGAT 8520 

ATCACTCAAA AGTTGCTTCA AGACTTCAAT 8580 

CCACCCTTTG TCTCTTGTAT TCAGGACATT 8640 

GACCCAGCGG CTGTTAGCGC TGGTTGCCTG 8700 

CTGCTAGAGG AGGCTCTGCT CCGCCTGCTG 8760 

GGGAAGGCCC GCCTCCCTCC TGATGTCCTC 882 0 

TCAATTGGAG AATACGACGT CCTCCGTGGG 8880 

AT CACT CAGA GTGCATTATT AGCAGAAGCC 8940 

TATGATGAGG CTCTCAATAA ACAAGACTGG 9000 

GATTTTTGGG AACTTGCATC CCTTGACTGT 9060 
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TACAACCACC TTGCTGAGTG GAAATCACTT GAATACTGTT CTACAGCCAG TATAGACAGT 912 0 

GAGAACCCCC CAGACCTAAA TAAAATCTGG AGTGAACCAT TTTATCAGGA AACATATCTA 9180 

CCTTACATGA TCCGCAGCAA GCTGAAGCTG CTGCTCCAGG GAGAGGCTGA CCAGTCCCTG 9240 

CTGACATTTA TTGACAAAGC TATGCACGGG GAGCTCCAGA AGGCGATTCT AGAGCTTCAT 9300 

5 TACAGTCAAG AGCTGAGTCT GCTTTACCTC CTGCAAGATG ATGTTGACAG AGCCAAATAT 9360 

TACATTCAAA ATGGCATTCA GAGTTTTATG CAGAATTATT CTAGTATTGA TGTCCTCTTA 9420 

CACCAAAGTA GACTCACCAA ATTGCAGTCT GTACAGGCTT TAACAGAAAT TCAGGAGTTC 9480 

ATCAGCTTTA TAAGCAAACA AGGCAATTTA TCATCTCAAG TTCCCCTTAA GAGACTTCTG 9540 

AACACCTGGA CAAACAGATA TCCAGATGCT AAAATGGACC CAATGAACAT CTGGGATGAC 9600 

10 ATCATCACAA ATCGATGTTT CTTTCTCAGC AAAATAGAGG AGAAGCTTAC CCCTCTTCCA 9660 

GAAGATAATA GTATGAATGT GGATCAAGAT GGAGACCCCA GTGACAGGAT GGAAGTGCAA 972 0 

GAGCAGGAAG AAGATATCAG CTCCCTGATC AGGAGTTGCA AGTTTTCCAT GAAAATGAAG 9780 

ATGATAGACA GTGCCCGGAA GCAGAACAAT TTCTCACTTG CTATGAAACT ACTGAAGGAG 9840 

CTGCATAAAG AGTCAAAAAC CAGAGACGAT TGGCTGGTGA GCTGGGTGCA GAGCTACTGC 9900 

15 CGCCTGAGCC ACTGCCGGAG CCGGTCCCAG GGCTGCTCTG AGCAGGTGCT CACTGTGCTG 9960 

AAAACAGTCT CTTTGTTGGA TGAGAACAAC GTGTCAAGCT ACTTAAGCAA AAATATTCTG 10020 

GCTTTCCGTG ACCAGAACAT TCTCTTGGGT ACAACTTACA GGATCATAGC GAATGCTCTC 10080 

AGCAGTGAGC CAGCCTGCCT TGCTGAAATC GAGGAGGACA AGGCTAGAAG AATCTTAGAG 10140 

CTTTCTGGAT CCAGTTCAGA GGATTCAGAG AAGGTGATCG CGGGTCTGTA CCAGAGAGCA 10200 

20 TTCCAGCACC TCTCTGAGGC TGTGCAGGCG GCTGAGGAGG AGGCCCAGCC TCCCTCCTGG 10260 

AGCTGTGGGC CTGCAGCTGG GGTGATTGAT GCTTACATGA CGCTGGCAGA TTTCTGTGAC 10320 

CAACAGCTGC GCAAGGAGGA AGAGAATGCA TCAGTTATTG ATTCTGCAGA ACTGCAGGCG 10380 

TATCCAGCAC TTGTGGTGGA GAAAATGTTG AAAGCTTTAA AATTAAATTC CAATGAAGCC 10440 

AGATTGAAGT TTCCTAGATT ACTTCAGATT ATAGAACGGT ATCCAGAGGA GACTTTGAGC 1050 0 

25 CTCATGACAA AAGAGATCTC TTCCGTTCCC TGCTGGCAGT TCATCAGCTG GATCAGCCAC 10560 

ATGGTGGCCT TACTGGACAA AGACCAAGCC GTTGCTGTTC AGCACTCTGT GGAAGAAATC 10 620 

ACTGATAACT ACCCGCAGGC TATTGTTTAT CCCTTCATCA TAAGCAGCGA AAGCTATTCC 10680 

TTCAAGGATA CTTCTACTGG T CAT AAGAAT AAGGAGTTTG TGGCAAGGAT TAAAAGTAAG 10740 

TTGGATCAAG GAGGAGTGAT TCAAGATTTT ATTAATGCCT TAGATCAGCT CTCTAATCCT 10800 

30 GAACTGCTCT TTAAGGATTG GAGCAATGAT GTAAGAGCTG AACTAGCAAA AACCCCTGTA 10860 

AATAAAAAAA ACATTGAAAA AATGTATGAA AGAATGTATG CAGCCTTGGG TGACCCAAAG 10 920 

GCTCCAGGCC TGGGGGCCTT TAGAAGGAAG TTTATTCAGA CTTTTGGAAA AGAATTTGAT 10980 

AAACATTTTG GGAAAGGAGG TTCTAAACTA CTGAGAATGA AGCTCAGTGA CTTCAACGAC 11040 

ATTACCAACA TGCTACTTTT AAAAATGAAC AAAGACT CAA AGCCCCCTGG GAATCTGAAA 11100 

35 GAATGTTCAC CCTGGATGAG CGACTTCAAA GTGGAGTTCC TGAGAAATGA GCTGGAGATT 11160 

CCCGGTCAGT ATGACGGTAG GGGAAAGCCA TTGCCAGAGT ACCACGTGCG AATCGCCGGG 11220 

TTTGATGAGC GGGTGACAGT CATGGCGTCT CTGCGAAGGC CCAAGCGCAT CATCATCCGT 11280 

GGCCATGACG AGAGGGAACA CCCTTTCCTG GTGAAGGGTG GCGAGGACCT GCGGCAGGAC 113 40 

CAGCGCGTGG AGCAGCT CTT CCAGGTCATG AATGGGATCC TGGCCCAAGA CTCCGCCTGC 11400 

40 AGCCAGAGGG CCCTGCAGCT GAGGACCTAT AGCGTTGTGC CCATGACCTC CAGGTTAGGA 11460 

TTAATTGAGT GGCTTGAAAA TACTGTTACC TTGAAGGACC TTCTTTTGAA CACCATGTCC 11520 

CAAGAGGAGA AGGCGGCTTA CCTGAGTGAT CCCAGGGCAC CGCCGTGTGA ATATAAAGAT 11580 

TGGCTGACAA AAATGTCAGG AAAACATGAT GTTGGAGCTT ACATGCTAAT GTATAAGGGC 11640 

GCTAATCGTA CTGAAACAGT CACGTCTTTT AGAAAACGAG AAAGTAAAGT GCCTGCTGAT 11700 

45 CTCTTAAAGC GGGCCTTCGT GAGGATGAGT ACAAGCCCTG AGGCTTTCCT GGCGCTCCGC 11760 

TCCCACTTCG CCAGCTCTCA CGCTCTGATA TGCATCAGCC ACTGGATCCT CGGGATTGGA 11820 

GACAGACATC TGAACAACTT TATGGTGGCC ATGGAGACTG GCGGCGTGAT CGGGATCGAC 11880 

TTTGGGCATG CGTTTGGATC CGCTACACAG TTTCTGCCAG TCCCTGAGTT GATGCCTTTT 11940 

CGGCTAACTC GCCAGTTTAT CAAT CTGATG TTACCAATGA AAGAAACGGG CCTTATGTAC 12 000 

50 AGCAT CATGG TACACGCACT CCGGGCCTTC CGCTCAGACC CTGGCCTGCT CACCAACACC 12 0 60 

ATGGATGTGT TTGTCAAGGA GCCCTCCTTT GATTGGAAAA ATTTTGAACA GAAAATGCTG 12120 

AAAAAAGGAG GGTCATGGAT TCAAGAAATA AATGTTGCTG AAAAAAATTG GTACCCCCGA 12180 

CAGAAAATAT GTTACGCTAA GAGAAAGTTA GCAGGTGCCA ATCCAGCAGT CATTACTTGT 12240 
GATGAGCTAC TCCTGGGTCA TGAGAAGGCC CCTGCCTTCA GAGACTATGT GGCTGTGGCA 12300 

55 CGAGGAAGCA AAGATCACAA CATTCGTGCC CAAGAACCAG AGAGTGGGCT TTCAGAAGAG 12360 

ACTCAAGTGA AGTGCCTGAT GGACCAGGCA ACAGACCCCA ACATCCTTGG CAGAACCTGG 12420 

GAAGGATGGG AG CC C T GG AT GTGAGGTCTG TGGGAGTCTG CAGATAGAAA GCATTACATT 12480 

GTTTAAAGAA T C T AC TAT AC TTTGGTTGGC AGCATTCCAT GAGCTGATTT TCCTGAAACA 12540 

CTAAAGAGAA ATGTCTTTTG TGCTACAGTT TCGTAGCATG AGTTTAAATC AAGATTATGA 12 600 

60 TGAGTAAATG TGTATGGGTT AAATCAAAGA TAAGGTTATA GTAACATCAA AGATTAGGTG 12660 

AGGTTTATAG AAAGATAGAT ATCCAGGCTT ACCAAAGTAT TAAGTCAAGA ATATAATATG 1272 0 

TGATCAGCTT TCAAAGCATT TACAAGTGCT GCAAGTTAGT GAAACAGCTG TCTCCGTAAA 12780 

TGGAGGAAAT GTGGGGAAGC CTTGGAATGC CCTTCTGGTT CTGGCACATT GGAAAGCACA 12840 
CTCAGAAGGC TTCATCACCA AGATTTTGGG AGAGTAAAGC TAAGTATAGT TGATGTAACA 12 90 0 

65 TTGTAGAAGC AGCAT AGGAA CAATAAGAAC AATAGGTAAA GCTATAATTA TGGCTTATAT 12960 

TTAGAAATGA CTGCATTTGA TATTTTAGGA TATTTTTCTA GGTTTTTTCC TTTCATTTTA 13020 

TTCTCTTCTA GTTTTGACAT TTTATGATAG ATTTGCTCTC TAGAAGGAAA CGTCTTTATT 13080 

TAGGAGGGCA AAAATTTTGG TCATAGCATT CACTTTTGCT ATTCCAATCT ACAACTGGAA 13140 

GATACATAAA AGTGCTTTGC ATTGAATTTG GGATAACTTC AAAAATCCCA TGGTTGTTGT 13200 

70 TAGGGATAGT ACTAAGCATT TCAGTTCCAG GAGAATAAAA GAAATTCCTA TTTGAAATGA 13260 

ATTCCTCATT TGGAGGAAAA AAAGCATGCA TTCTAGCACA ACAAGATGAA ATTATGGAAT 13320 

ACAAAAGTGG CTCCTTCCCA TGTGCAGTCC CTGTCCCCCC CCGCCAGTCC TCCACACCCA 133 80 
AACTGTTTCT GATTGGCTTT TAGCTTTTTG TTGTTTTTTT TTTTCCTTCT AACACTTGTA 13440 

TTTGGAGGCT CTTCTGTGAT TTTGAGAAGT ATACTCTTGA GTGTTTAATA AAGTTTTTTT 13500 
CCAAAAGTA 



75 



Seq ID NO: 99 Protein sequence: 
Protein Accession #: NP_008835.5 



80 1 11 21 31 41 51 

II I I I I 

MAGSGAGVRC SLLRLQETLS AADRCGAALA GHQLIRGLGQ ECVLSSSPAV LALQTSLVFS 60 

RDFGLLVFVR KSLNSIEFRE CREEILKFLC IFLEKMGQKI APYSVEIKNT CTSVYTKDRA 120

AKCKIPALDL LIKLLQTFRS SRLMDEFKIG ELFSKFYGEL ALKKKIPDTV LEKVYELLGL 180

85 LGEVHPSEMI NNAENLFRAF LGELKTQMTS AVREPKLPVL AGCLKGLSSL LCNFTKSMEE 240

DPQTSREIFN FVLKAIRPQI DLKRYAVPSA GLRLFALHAS QFSTCLLDNY VSLFEVLLKW 300

CAHTNVELKK AALSALESFL KQVSNMVAKN AEMHKNKLQY FMEQFYGIIR NVDSNNKELS 360



227 



10 



15 



20 
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30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 
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IAIRGYGLFA GPCKVINAKD 
LLYLDTVPEV YTPVLEHLW 
TWHQGLIRI CSKPWLPKG 
MDSILADEAF FSVNSSSESL 
WMIPTSDPAA NLHPAKPKDF 
PLISGFYKLL S I T VRNAKK I 
YKDELLASCL TFLLSLPHNI 
DRHVMQPYYK DILPCLDGYL 
SSNEAISLEE IRIRWQMLG 
MKPVIFLDVF LPRVTELALT 
LYKRTFPVLL RLACDVDQVT 
VDSTLRDFCG RCIREFLKWS 
AFNNIYREFR EEESLVEQFV 
KHVSLNKAKK RRLPRGFPPS 
NRSPNLWLKD VLKEEGVSFL 
LAAIiECYNTF IGERTVGALQ 
RTSPQEGERY NYSKCTWVR 
SIGFNIGDVQ VMAHLPDVCV 
AQVDRSRLAA WSACKQLHR 
PSLDLSCKQL ASGLLELAFA 
SLFSETINTE LLKNLDLAVL 
TILQHWKKCD SWWAKDSPLE 
DTKLDLHLKG QAVTLLPFFT 
DCMKKFLDAL ELSQSPMLLE 
VYEMFRKDDP RLSFTRQSFV 
STFDTQITKK MGYYKILDVM 
DAFTENMAGE NQBLERRRLY 
LIDLKRRYNF PVEVEVPMER 
SQFDFSTGVQ SYSYSSQDPR 
VKHMHR SLGP PQGEEDSVPR 
AKHWLSPLLQ LAASENNGGE 
KHVFHPKRAV FRHNLE I I KT 
MANDLPPYDP QCGIQSSEYF 
LCELVAKQLK QHQNTMEDKF 
VLCRVEGMTE LYFQLKSKDF 
FVSHPSTTCR EQMYNILMWI 
IRNFWSHETR LPSNTLDRIiL 
LSECEFQEYT IDSDWRFRST 
QHDFTLTQTA DGRSSFDWLT 
GKKRLGLPGD EVDNKVKGAA 
LKMKQDAQW LYRSYRHGDL 
DKFKTLSEKN NITQKLLQDF 
LASLQQPVGI RLLEEALLRL 
GIFTSEIGTK QITQSALLAE 
CYNHLAEWKS LEYCSTAS ID 
LLTFIDKAMH GELQKAILEL 
LHQSRLTKLQ SVQALTEIQE 
DIITNRCFFIi SKIEEKLTPL 
KMIDSARKQN NFSLAMKLLK 
LKTVSLLDEN NVSSYLSKNI 
ELSGSSSEDS EKVIAGLYQR 
DQQLRKEEEN ASVIDSAELQ 
SLMTKEISSV PCWQFISWIS 
SFKDTSTGHK NKEFVARIKS 
VNKKNIEKMY ERMYAALGDP 
DITNMLLLKM NKDSKPPGNL 
GFDERVTVMA SLRRPKRIII 
CSQRALQLRT YSWPMTSRL 
DWLTKMSGKH DVGAYMLMYK 
RSHFAS SHAL ICISHWILGI 
FRLTRQFINL MIiPMKETGLM 
LKKGGSWIQE INVAEKNWYP 
ARGSKDHNIR AQEPESGLSE 
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VDFMYVELIQ 
MQIDSFPQYS 
PESESEDHRA 
NHLLYDEFVK 
SAFINLVEFC 
KYFEGVSPKS 
I ELDVRAYVP 
KTSALSDETK 
SLGGQINKNL 
ASDRQTKVAA 
RQLYEPLVMQ 
IKQITPQQQE 
FEALVIYMES 
AS LCLLDLVK 
INTFEGGGCG 
VLGTEAQSSL 
IMEFTTTLLN 
NLMKALKMSP 
AGLLHNILPS 
FGGLCERIiVS 
ELMQSSVDNT 
TKMAVLALLA 
SLTGGSLEEL 
LMTEVLCREQ 
DRSLLTLLWH 
YSRLPKDDVH 
HCAAYNCA I S 
KKKYIEIRKE 
PATGRFRRRE 
DLPSWMKFLH 
GIHYMWEIV 
LVECWKDCLS 
QALVNNMSFV 
IVCLNKVTKS 
VQVMRHRDDE 
HDNYRDPESE 
ALNSLYSPKI 
VLTPMFVETQ 
GSSTDPLVDH 
GRTDLLRLRR 
PDIQIKHSSL 
NRFLNTTFSF 
IiPAELPAKRV 
ARSDYSEAAK 
SENPPDLNKI 
HYSQELSLLY 
FISFISKQGN 
PEDNSMNVDQ 
ELHKES KTRD 
LAFRDQNILL 
AFQHLSEAVQ 
AYPALWEKM 
HMVALLDKDQ 
KLDQGGVIQD 
KAPGLGAFRR 
KECSPWMSDF 
RGHDEREHPF 
GLIEWLENTV 
GANRTETVTS 
GDRHLNNFMV 
YS I MVHALRA 
RQKICYAKRK 
ETQVKCLMDQ 



RCKQMFLTQT 
PKMQLVCCRA 
SGEVRTGKWK 
SVLKIVEKLD 
REI LPEKQAE 
LKHSPEDPEK 
ALQMAFKLGL 
NNWEVSALSR 
LTVTSSDEMM 
CELLHSMVMF 
LIHWFTNNKK 
KSPVNTKSLF 
LALAHADEKS 
WLLAHCGRPQ 
QPSGILAQPT 
LKAVAFFIiES 
TSPEGWKLLK 
YKDILETHLR 
QSTDLHHSVG 
LLLNPAVLST 
KMVSAVLNGM 
KILQIDSSVS 
RRVLEQLIVA 
QHVMEELFQS 
CSLDALREFF 
AKESKINQVF 
VICCVFNELK 
AREAANGDSD 
QRDPTVHDDV 
GKLGNPIVPL 
ATILSWTGLA 
IPYRLIFEKF 
RYKEVYAAAA 
FPPLADRFMN 
RQKVCLDI I Y 
TDNDSQEIFK 
EVHFLSLATN 
ASQGTLQTRT 
TSPSSDSLLF 
RFMRDQEKLS 
ITPLQAVAQR 
FPPFVSCIQD 
RGKARLPPDV 
QYDEALNKQD 
WSEPFYQETY 
LLQDDVDRAK 
LSSQVPLKRL 
DGDPSDRMEV 
DWLVSWVQSY 
GTTYRI I ANA 
AAEEEAQPPS 
LKAIiKLNSNE 
AVAVQHSVEE 
FINALDQLSN 
KFIQTFGKEF 
KVEFIiRNELE 
LVKGGEDLRQ 
TLKDLLLNTM 
FRKRESKVPA 
AMETGGVIGI 
FRSDPGLIiTN 
LAGANPAVIT 
ATDPNILGRT 



DTGDDRVYQM 
IVKVFLALAA 
VPTYKDYVDL 
LTLEIQTVGE 
FFEPWVYSFS 
YSCFALFVKF 
SYTPLAEVGL 
AAQKGFNKW 
KSYVAWDREK 
MLGKATQMPE 
FESQDTVALL 
KRLYSLALHP 
LGTIQQCCDA 
TECRHKSIEL 
LLYLRGPFSL 
IAMHDI IAAE 
KDLCNTHLMR 
EKITAQSIEE 
TELLSLVYKG 
ASLGSSQGSV 
LDQSFRERAN 
FNTSHGSFPE 
HFPMQSREFP 
SFRRIARRGS 
STIWDAIDV 
HGSCITEGNE 
FYQGFLFSEK 
GPSYMSSLSY 
LELEMDELNR 
NIRLFLAKLV 
TPTGVPKDEV 
SGKDPNSKDN 
EVLGLILRYV 
AVFFLLPKFH 
KMMPKLKPVE 
LAKDVIiIQGL 
FLLEMTSMSP 
QEGSLSARWP 
AHKRSERLQR 
LMYARKGVAE 
DPIIAKQL.FS 
ISCQHAALLS 
LRWVELAKLY 
WVDGEPTEAE 
LPYMIRSKLK 
YYIQNGIQSF 
LNTWTNRYPD 
QEQEEDISSL 
CRLSHCRSRS 
LSSEPACLAE 
WSCGPAAGVI 
ARLKFPRLLQ 
ITDNYPQAIV 
PELLFKDWSN 
DKHFGKGGSK 
I PGQYDGRGK 
DQRVEQLFQV 
SQEEKAAYLS 
DLLKRAFVRM 
DFGHAFGSAT 
TMDVFVKEPS 
CDELLLGHEK 
WEGWEPWM 



PSFLQSVASV 
KGPVLRNCIS 
FRHLLSSDQM 
QENGDEAPGV 
YELILQSTRL 
GKEVAVKMKQ 
NALEEWSIYI 
LKHLKKTKNL 
RLSFAVPFRE 
GGQGAPPMYQ 
EAILDGIVDP 
NAFKRLGASL 
IDHLCRIIEK 
FYKFVPLLPG 
QATLCWLDLL 
KCFGTGAAGN 
VLVQTLCEPA 
LCAVNLYGPD 
IAPGDERQCL 
IHFSHGEYFY 
QKHQGLKLAT 
VFTTYISLLA 
PGTPRFNNYV 
CVTQVGLLES 
LKSRFTKLNE 
LTKTLIKLCY 
PEKNLLIFEN 
LADSTLSEEM 
HECMAPLTAL 
INTEEVFRPY 
LANRLLNFLM 
SVGIQLLGIV 
MERKNILEES 
GVLKTLCLEV 
LRELLNPWE 
IDENPGLQLI 
DYPNPMFEHP 
VAGQIRATQQ 
APLKSVGPDF 
QKREKEIKSE 
SLFSGILKEM 
LDPAAVSAGC 
RSIGEYDVLR 
KDFWELASLD 
LLLQGEADQS 
MQNYSSIDVL 
AKIVIDPMNIWD 
IRSCKFSMKM 
QGCSEQVLTV 
IEEDKARRIL 
DAYMTLADFC 
IIERYPEETL 
YPFIISSESY 
DVRAELAKTP 
LLRMKLSDFN 
PLPEYHVRIA 
MNGILAQDSA 
DPRAP PCEYK 
STSPEAFLAL 
QFLPVPELMP 
FDWKNFEQKM 
APAFRDYVAV 



Seq ID NO: 100 DNA sequence 
Nucleic Acid Accession #: NM_000673 
Coding sequence: 101-1225 



85 



ATGTGAAGGC 
GTCTATGTTT 
TATTAAATGC 
AGAAGTTGCC 
TCGCACAGAT 
ACATGAGGCA 
TGACAAAGTC 
AGATGGCAAC 
CACCAGATTT 
CGAGTACACA 
GAAAGTCTGT 
CAAGGTCAAA 
CATCATGGGC 
CAAATTTGAG 
CAAACCCATC 
AGTTATTGGG 
GACCAGCGTG 



I 1 • 

ACAAGCTGCT 
GCAGAAATAC 
AAAGCAGCTG 
CCACCAAAGA 
GACCATGTGA 
ACTGGGATTG 
ATCCCTCTCT 
CTTTGCATTA 
ACATGCAAGG 
GTGGTGGATG 
TTAATTGGCT 
CCTGGTTCCA 
TGTAAGTCAG 
AAGGCCATGG 
AGTGAGGTGC 
CATCTTGAAA 
GTTGTAGGAG 



21 
I 

GTTATATACA 
AGATCCAAGA 
TGCTTTGGGA 
CTAAAGAAGT 
TAAAAGGAAC 
TAGAGAGCAT 
TTCTGCCACA 
GGAGCGATAT 
GCAAACCAGT 
AATCTTCTGT 
GTGGGTTTTC 
CTTGCGTCGT 
CTGGTGCATC 
CTGTAGGTGC 
TGTCAGAAAT 
CCATGATTGA 
TTCCTCCATC 



31 
I 

ACAGAGTGAA 
CAAAGACAGG 
GCAGAAGCAA 
TCGCATTAAG 
AATGGTGTCC 
TGGAGAAGGA 
ATGTAGAGAA 
TACTGGTCGT 
ACACCACTTC 
TGCTAAGATT 
CACTGGATAT 
CTTTGGCCTG 
TAGGATCATT 
CACTGAGTGT 
GACAGGCAAC 
TGCCCTGGCA 
AGCCAAGATG 



41 
I 

CTGAG CATCA 
ATGGGCACTG 
CCCTTCTCCA 
ATTTTGGCCA 
AAGTTTCCAG 
GTGACTACAG 
TGCAATGCTT 
GGAGTACTGG 
ATGAACACCA 
GATGATGCAG 
GGCGCTGCTG 
GGAGGAGTTG 
GGGATTGACC 
ATCAGTCCCA 
AACGTGGGAT 
TCCTGCCACA 
CTCACCTATG 



51 

I 

GTCAGAAAAA 
CTGGAAAAGT 
TTGAGGAAAT 
CAGGAATCTG 
TGATTGTGGG 
TGAAACCAGG 
GTCGCAACCC 
CTGATGGCAC 
GTACATTTAC 
CTCCTCCTGA 
TTAAAACTGG 
GCCTGTCAGT 
TCAACAAAGA 
AGGACTCTAC 
ACACCTTTGA 
TGAACTATGG 
ACCCGATGTT 



420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2 940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 



228 



10 



15 



WO 02/086443 

GCTCTTCACT GGACGCACAT 
TGTCCCAAAA CTAGTGACTG 
TCATGTTTTA CCATTTAAAA 
CATTCGAACG GTCCTGACGT 
GAACTGGAGT TTCTCTTGTG 
ACAAGCATAA GTAGAAGATT 
TATAAACATT TAAAGTCTTG 
TTGATTTACA TTTTGTAAGG 
TATGTTGAAA TGGAGATTTT 
CAGATATAGC GTATAAAGAT 
TTGAAACTAT TATTTTTTAG 
TAACTTGGAT TACATTTTGA 
AGAAAGACAG AAAAGATTAA 
ATAACTTGGT GAAACTGAAA 
TATTAATATT TTAGAAAATA 
ATATTATCAT ACTT AT CAT A 
CCTATTCACT GTGCTTAGTA 
CTAAACCG 
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GGAAGGGATG 
AGTT CCTGGC 
AAAT CAGTGA 
TTTGAGATCC 
AGAGTTCCCT 
TGTTGAAGAC 
TGAGCACCTG 
CTATAATTGT 
TAAGAGTTTT 
ATAGTAAATG 
ATTTGAATAT 
AATCAGTTCA 
GGGACGGGCA 
AAGTATATCA 
TTCCTTTTGT 
ATGTTCAATT 
GTGACTCCAT 



TGTCTTTGGA 
AAAGAAATTT 
AGGATTTGAG 
AAAGTGGCAG 
CATCTGAAAT 
ATAGAACCCT 
GGAATTAGTA 
ATCTTTTAAG 
AACCAGCTGC 
CATCTCCCAG 
AAATGTATTT 
TTCCATGATG 
CATTTTTCAA 
TATGGGTACA 
AATACTGAAT 
TGATACAGTA 
TTAATAAAAA 



GGTTTGAAAA 
GACCTGGACC 
CTGCTCAATT 
GAGGTCTGTG 
CATGTATCTG 
TATAAAGAAT 
TAATAACAAT 
AAAACATACA 
TGCAGATATA 
AGTAATATTC 
TTTAAACACT 
CATATTACTG 
CGATTAAGAA 
CAAGGCTATT 
ATAAACATAG 
GAATTGCAAG 
GTGTTTTTAG 



GCAGAGATGA 1080 

AGTTGATAAC 1140 

CAGGACAAAG 1200 

TTGTCATGGT 1260 

TCTCACAAAT 1320 

T ATT AACCTT 13 80 

GTTAATATTT 1440 

CTTGGATTTC 1500 

TAACTCAAAA 1560 

ACTTAACACA 1620 

TGTTATGAGT 1680 

GAT TAG AT T A 1740 

TCATCATTAC 1800 

TGCCAGCATA 1860 

AGCTAGAGTC 1920 

TCCCTAAGTC 1980 

TTTTTAACAA 2 040 



20 



Seq ID NO: 101 Protein sequence: 
Protein Accession #: NP_000664



11 



25 MGTAGKV I KC 
KFPVIVGHEA 
GVLADGTTRF 
GAAVKTGKVK 
ISPKDSTKPI 

3 0 LTYDPMLLFT 
LLNSGQSIRT 



KAAVLWEQKQ 
TGIVESIGEG 
TCKGKPVHHF 
PGSTCWFGL 
SEVLSEMTGN 
GRTWKGCVFG 
VLTF 



21 
I 

PFSIEEIEVA 
VTTVKPGDKV 
MNTSTFTEYT 
GGVGLiS V IMG 
NVGYTFEVIG 
GLKSRDDVPK 



31 
i 

PPKTKEVRIK 
IPLFLPQCRE 
WDESSVAKI 
CKSAGASRII 
HLETM I DAL A 
LVTEFLAKKF 



41 
1 

ILATGICRTD 
CNACRNPDGN 
DDAAPPEKVC 
GIDLNKDKFE 
SCHMNYGTSV 
DLDQLITHVL 



51 
i 

DHV I KGTMVS 60 

LCIRSDITGR 120 

LIGCGFSTGY 180 

KAMAVGATEC 240 

WGVPPSAKM 300 

PFKKISEGFE 360 



35 



40 



45 



50 



Seq ID NO: 102 DNA sequence 

Nucleic Acid Accession #: NM_006783.1

Coding sequence: 1..786 



ATGGATTGGG 
GGGAAGGTGT 
CAGGAAGTGT 
AAAAATGTGT 
CTGATCTTCG 
GAAACCACTC 
ATTAAAAAGC 
TTTTTCCGAA 
TACCACCTGC 
TTTATTTCTA 
ATTTGCATGC 
AGATCAAAGA 
CAGAATGAAA 
AGCTAA 



11 
i 

GGACGCTGCA 
GGATCACAGT 
GGGGTGACGA 
GCTATGACCA 
TCTCCACCCC 
GCAAGTT C AG 
ACAAGGTTCG 
TCATCTTTGA 
CCTGGGTGTT 
GGCCAACAGA 
TGCTTAACGT 
GAGCACAGAC 
TGAATGAGCT 



21 
i 

CACTTTCATC 
CATCTTTATT 
GCAAGAGGAC 
CTTTTTCCCG 
AGCGCTGCTG 
GCGAGGAGAG 
GATAGAGGGG 
AGCAGCCTTT 
GAAATGTGGG 
GAAGACCGTG 
GGCAGAGTTG 
GCAAAAAAAT 
GATTTCAGAT 



31 
I 

GGGGGTGTCA 
TTCCGAGTCA 
TTCGTCTGCA 
GTGTCCCACA 
GTGGCCATGC 
AAGAGGAATG 
TCGCTGTGGT 
ATGTATGTGT 
ATTGACCCCT 
TTTACCATTT 
TGCTACCTGC 
CACCCCAATC 
AGTGGTCAAA 



41 
I 

ACAAACACTC 
TGATCCTAGT 
ACACACTGCA 
TCCGGCTGTG 
ATGTGGCCTA 
ATTTCAAAGA 
GGACGTACAC 
TTTACTTCCT 
GCCCCAACCT 
TTATGATTTC 
TGCTGAAAGT 
ATGCCCTAAA 
ATGCAATCAC 



51 

I 

CACCAGCATC 60 

GGTGGCTGCC 12 0 

ACCGGGATGC 180 

GGCCCTCCAG 240 

CTACAGGCAC 300 

CATAGAGGAC 360 

CAGCAGCATC 420 

TTACAATGGG 480 

TGTTGACTGC 540 

TGCGTCTGTG 600 

GTGTTTTAGG 660 

GGAGAGTAAG 720 

AGGTTTCCCA 780 



Seq ID NO: 103 Protein sequence: 
55 Protein Accession #: NP_006774.1 



60 



65 



70 



75 



80 



I 

MDWGTLHTFI 
KNVCYDHFFP 
IKKHKVRIEG 
FISRPTEKTV
QNEMNELISD 



11 21 31 41 51 

I I I I 1 

GGVNKHSTSI GKVWITVIFI FRVMILVVAA QEVWGDEQED FVCNTLQPGC

VSHIRLWALQ LIFVSTPALL VAMHVAYYRH ETTRKFRRGE KRNDFKDIED

SLWWTYTSSI FFRIIFEAAF MYVFYFLYNG YHLPWVLKCG IDPCPNLVDC

FTIFMISASV ICMLLNVAEL CYLLLKVCFR RSKRAQTQKN HPNHALKESK

SGQNAITGFP S 



Seq ID NO: 104 DNA sequence 
Nucleic Acid Accession #: NM_020411 
Coding sequence: 86-526 



GGACCTGGGA 
AAGGCACGAG 
ACTGGGCGTC 
GGCGACTCGG 
ACAAACACAG 
GAACCAGCAG 
ACAGCTGAGA 
ACCGGGGATA 
ACACTGTAAA 
AAACAACGCA 
CAGCTTTCAC 



11 

I 

AGGAGCATAG 
GGAACCTCAC 
TTCCCATCGG 
GTCCCTGAGG 
AACCACACAG 
CTGAAAGTCG 
TCCCAGTGCG 
AATCTGGATT 
ATGCCAGAAG 
AGCTGGTTTT 
CAAAAAAAAA 



21 
I 

GACAGGGCAA 
TGCGCATGCT 
CCCCTTCGCC 
TCTGGATTCT 
CCAGTCCCAG 
GGATCCTACA 
CGACATGGAA 
TGGGTTCCGG 
CAGGTGAAGA 
ATATTAGATA 
AAAAAA 



31 

I 

GGCGGGATAA 
CCTTTGGTGC 
AGTGTGGGGA 
TTCTCCGCTA 
GAGCCCAGTA 
CCTGGGCAGC 
GGTGATCTGC 
CGTCAAGGTG 
GCAACCACAA 
TTTGACTTAA 



41 



GGAGGGGCAC 
CCACCTCAGT 
ACGCGGCGGA 
CTGAGACACG 
ATGGAGAGCC 
AGACAGAAGA 
AAGAGCTGCA 
AAGATAATAC 
GTTTAAATGA 
ACTATCT CAA 



51 
I 

CACAGCCCTT 
GCGCATGTTC 
GCTGTGAGCC 
GCGGACACAC 
CCAAAAAGAA 
AGATCAGGAT 
TCAGTCAAAC 
CTAAAGAGGA 
AGACAAGCTG 
TAAAGTTTTG 



60 
120 
180 
240 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 



Seq ID NO: 105 Protein sequence: 
85 Protein Accession #: NP_065144.1



11 



21 



31 



41 



51 



229 



WO 02/086443 

t I I I I I 

MLLWCPPQCA CSLGVFPSAP SPVWGTRRSC EPATRVPEVW ILSPLLRHGG HTQTQNHTAS 
PRSPVMESPK KKNQQLKVGI LHLGSRQKKI RIQLRSQCAT WKVICKSCIS QTPGINLDLG 
SGVKVKIIPK EEHCKMPEAG EEQPQV 

Seq ID NO: 106 DNA sequence 
Nucleic Acid Accession #: J04129 
Coding sequence: 99-587 

1 11 21 31 41 51 

| | | | | |
CATCCCTCTG GCTCCAGAGC TCAGAGCCAC CCACAGCCGC AGCCATGCTG TGCCTCCTGC 

TCACCCTGGG CGTGGCCCTG GTCTGTGGTG TCCCGGCCAT GGACATCCCC CAGACCAAGC 

AGGACCTGGA GCTCCCAAAG TTGGCAGGGA CCTGGCACTC CATGGCCATG GCGACCAACA 

ACATCTCCCT CATGGCGACA CTGAAGGCCC CTCTGAGGGT CCACATCACC TCACTGTTGC 

CCACCCCCGA GGACAACCTG GAGATCGTTC TGCACAGATG GGAGAACAAC AGCTGTGTTG

AGAAGAAGGT CCTTGGAGAG AAGACTGGGA ATCCAAAGAA GTTCAAGATC AACTATACGG 

TGGCGAACGA GGCCACGCTG CTCGATACTG ACTACGACAA TTTCCTGTTT CTCTGCCTAC 

AGGACACCAC CACCCCCATC CAGAGCATGA TGTGCCAGTA CCTGGCCAGA GTCCTGGTGG

AGGACGATGA GATCATGCAG GGATTCATCA GGGCTTTCAG GCCCCTGCCC AGGCAGCTAT 

GGTACTTGCT GGACTTGAAA CAGATGGAAG AGCCGTGCCG TTTCTAGCTC ACCTCCGCCT 

CCAGGAAGAC CAGACTCCCA CCCTTCCACA CCTCCAGAGC AGTGGGACTT CCTCCTGCCC 

TTTCAAAGAA TAACCACAGC TCAGAAGACG ATGACGTGGT CATCTGTGTC GCCATCCCCT

TCCTGCTGCA CACCTGCACC ATTGCCATGG GGAGGCTGCT CCCTGGGGGC AGAGTCTCTG 

GCAGAGGTTA TTAATAAACC CTTGGAGCAT G 



Seq ID NO: 107 Protein sequence: 
Protein Accession #: AAA60147 



1 11 21 31 41 51

l l l I I I 

MDIPQTKQDL ELPKLAGTWH SMAMATNNIS LMATLKAPLR VHITSLLPTP EDNLEIVLHR
WENNSCVEKK VLGEKTGNPK KFKINYTVAN EATLLDTDYD NFLFLCLQDT TTPIQSMMCQ 
YLARVLVEDD EIMQGFIRAF RPLPRHLWYL LDLKQMEEPC RF 



Seq ID NO: 108 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 48-794

1 11 21 31 41 51 

I i i I i i 

TCCCAGGCAG CAGTTAGCCC GCCGCCCGCC TGTGTGTCCC CAGAGCCATG GAGAGAGCCA
GTCTGATCCA GAAGGCCAAG CTGGCAGAGC AGGCCGAACG CTATGAGGAC ATGGCAGCCT 
TCATGAAAGG CGCCGTGGAG AAGGGCGAGG AGCTCTCCTG CGAAGAGCGA AACCTGCTCT 
CAGTAGCCTA TAAGAACGTG GTGGGCGGCC AGAGGGCTGC CTGGAGGGTG CTGTCCAGTA 
TTGAGCAGAA AAGCAACGAG GAGGGCTCGG AGGAGAAGGG GCCCGAGGTG CGTGAGTACC 
GGGAGAAGGT GGAGACTGAG CTCCAGGGCG TGTGCGACAC CGTGCTGGGC CTG CTGGACA 
GCCACCTCAT CAAGGAGGCC GGGGACGCCG AGAGCCGGGT CTTCTACCTG AAGATGAAGG 
GTGACTACTA CCGCTACCTG GCCGAGGTGG CCACCGGTGA CGACAAGAAG CGCATCATTG 
ACTCAGCCCG GTCAGCCTAC CAGGAGGCCA TGGACATCAG CAAGAAGGAG ATGCCGCCCA 
CCAACCCCAT CCGCCTGGGC CTGGCCCTGA ACTTTTCCGT CTTCCACTAC GAGAT CGCCA 
ACAGCCCCGA GGAGGCCATC TCTCTGGCCA AGACCACTTT CGACGAGGCC ATGGCTGATC 
TGCACACCCT CAGCGAGGAC TCCTACAAAG ACAGCACCCT CATCATGCAG CTGCTGCGAG 
ACAACCTGAC ACTGTGGACG GCCGACAACG CCGGGGAAGA GGGGGGCGAG GCTCCCCAGG 
AGCCCCAGAG CTGAGTGTTG CCCGCCACCG CCCCGCCCTG CCCCCTCCAG TCCCCCACCC 
TGCCGAGAGG ACTAGTATGG GGTGGGAGGC CCCACCCTTC TCCCCTAGGC GCTGTTCTTG 
CTCCAAAGGG CTCCGTGGAG AGGGACTGGC AGAGCTGAGG CCACCTGGGG CTGGGGATCC 
CACTCTTCTT GCAGCTGTTG AGCGCACCTA ACCACTGGTC ATGCCCCCAC CCCTGCTCTC 
CGCACCCGCT TCCTCCCGAC CCCAGGACCA GGCTACTTCT CCCCTCCTCT TGCCTCCCTC 
CTGCCCCTGC TGCCTCTGAT CGTAGGAATT GAGGAGTGTC CCGCCTTGTG GCTGAGAACT 
GGACAGTGGC AGGGGCTGGA GATGGGTGTG TGTGTGTGTG TGTGTGTGTG TGTGTGTGTG 
CGCGCGCGCC AGTGCAAGAC CGAGATTGAG GGAAAGCATG TCTG CTGGGT GTGACCATGT 
TTCCTCTCAA TAAAGTTCCC CTGTGACACT C 



Seq ID NO: 109 Protein sequence: 
Protein Accession #: NP_006133.1 

1 11 21 31 41 51 

I I I I.I 1 

MERASLIQKA KLAEQAERYE DMAAFMKGAV EKGEELSCEE RNLLSVAYKN WGGQRAAWR 

VLSSIEQKSN EEGSEEKGPE VREYREKVET ELQGVCDTVL GLLDSHLIKE AGDAESRVFY 

LKMKGDYYRY LAEVATGDDK KRI IDSARSA YQEAMD I SKK EMPPTNPIRL GLALNFSVFH 

YEIANSPEEA ISLAKTTFDE AMADLHTLSE DSYKDSTIiIM QLLRDNLTLW TADNAGEEGG 
EAPQEPQS 



Seq ID NO: 110 DNA sequence 
Nucleic Acid Accession #: NM_000695 
Coding sequence: 407-1564 



1 11 21 31 41 51 

1 1 I I I I 

CACGAGTTGG TTTGGGAGCT GCCAGTCTCC TGGGAGGATC GCAGTCAGCA GAGCAGGGCT 

GAGGCCTGGG GGTAGGAGCA GAGCCTGCGC ATCTGGAGGC AGCATGT CCA AGAAAGGGAG 

TGGAGGTGCA GCGAAGGACC CAGGGGCAGA GCCCACGCTG GGGATGGACC CCTTCGAGGA 

CACACTGCGG CGGCTGCGTG AGGCCTTCAA CTGAGGGCGC ACGCGGCCGG CCGAGTTCCG 

GGCTGCGCAG CTCCAGGGCC TGGGCCACTT CCTTCAAGAA AACAAGCAGC TTCTGCGCGA 



230 



10 



15 



20 



25 



30 



35 



40 



WO 02/086443 

CGTGCTGGCC CAGGACCTGC 
TTGCCAGAAC GAGGTTGACT 
ACGGTCCACG AACCTGTTCA 
CCTGGTCCTC ATCATCGCAC 
GGGCACCCTC CCCGCAGGGA 
AGAGAAGGTC CTGGCTGAGG 
GCTGGGCGGA CCCCAGGAGA 
CACAGGGAGC CCTCGTGTGG 
TGTCACCCTG GAGCTGGGGG 
GACCGTGGCC AACCGCGTGG 
CCCTGACTAC GTCCTGTGCA 
CACCATCACC CGTTTCTATG 
CAACCAGAAA CAGTTCCAGC 
GGGCCAGAGC AACGAGAGCG 
GACGGAGCCT GTGATGCAGG 
GAGCGTGGAC GAGGCCATCA 
CTTCTCCAAC AGCAGACAGG 
TGGAGGCAAT GAGGGCTTCA 
CCACAGTGGG ATGGGCCGGT 
CACCTGCCTG CTCGCCCCCT 
TACCGACTGG AACCAGCAGC 
GTGAGCGTCC CACCCGCCTC 
GCTTATGCTC CCAACTCACA 
TGGAGCTGTC ACATGACTGC 
TCTGGGGGAC GCTGCTCGAG 
CACCCCACCC TCCCCAATTC 
CACAGGGGCA GTGTCACCCT 
GAACGGTTGA GAGCGTGGAG 
TTCCACCTCT GCCCCATCCC 
CCCACACTGG TCTCTGCACC 
AGCTCCATCC ACTGGGAAAA 
CTGGGGGCAA GTCCCTTGAC 
CCAAAATGGA GTCACTTATG 
CCCTCACACA CACATGCCCG 
AGACACAGGG CGTATGGAAA 
GATGCTTACC TACCACGGCC 
TGTGACTTAC AAACCTTGTT 
CCCTTGGCTG TGGCCCTCTG 
GGAATCCTCT GCTCCTCCCA 



PCT/US02/12476 



ATAAGCCAGC 
ACGCTCT CAA 
TGAAGCTGGA 
CCTGGAACTA 
ATTGCGTGGT 
TGCTGCCCCA 
CAGGGCAGCT 
GCAAGATTGT 
GCAAGAACCC 
CCTGGTTCTG 
GCCCCGAGAT 
GCGACGACCC 
GGCTGCGGGC 
ATCGCTACAT 
AGGAGATCTT 
AGTT CATCAA 
TTGTGAACCA 
CCTACATATC 
ACCACGGCAA 
CCGGCCTGGA 
TGTTACGCTG 
CAACGGGTCA 
TTGTTCCTCC 
ATCCTGCCTG 
AGAGGCGGAG 
CAGCCCTTTG 
GGAAAATACA 
CCCTCCAGGC 
AACTGCACCA 
ACCCCTCTGG 
CTGGGGTTTG 
TTCTCTGAGC 
CCAAACTCTA 
TAACAGGATT 
AGCACGTCCT 
GTCTCCACCA 
TAAAAGCTGC 
TGTATGCCTG 
AATAAATTCA 



TTTCGAGGCA 
GAACCTTCAG 
CTCGGTCTTC 
CCCATTGAAC 
GCTGAAGCCG 
GTACCTGGAC 
GCTAGAGCAC 
CATGACTGCT 
CTGCTACGTG 
CTACTTCAAT 
GCAGGAGAGG 
CCAGAGCTCC 
ATTGCTGGGC 
CGCCCCCACG 
CGGGCCCATC 
CCGGCAGGAG 
GATGCTGGAG 
TCTGCTGTCC 
GTTCACCTTC 
GAAATTAAAG 
GGGCATGGGC 
CACAGAGAAA 
AGACCGCAGG 
CCAGGGCTGC 
AGGCCGCAGA 
CCCTCTCGGT 
GTGCCCTGCC 
CTTTGCTCTC 
GCACTGCCTC 
TTCACACCGC 
CATC ACT CCA 
CTCAGTTTCC 
ATAAAATGGA 
TATCACCAAG 
CAAAGACTGT 
GAAAACCATC 
TTACATGGAC 
GGATCCTTCC 
TCTGTTC 



GACATATCTG 
GCCTGGATGA 
ATCTGGAAGG 
CTGACCCTGG 
TCAGAAATCA 
CAGAGCTGCT 
AAGTTGGACT 
GCCACCAAGC 
GACGACAACT 
GCCGGCCAGA 
CTGCTGCCCG 
CCAAACCTGG 
TGCGGCCGCG 
GTGCTGGTGG 
CTGCCCATCG 
AAGCCCCTGG 
CGGACCAGCA 
GTGCCATTCG 
GACACCTTCT 
GAGATCCGCT 
TCCCAGAGCT 
CCTGAGTCTA 
CTCCCCCAGC 
AAAGCAAGGT 
ACATGCCAGG 
CAGGGTTGGC 
TTCTTAGGGG 
CCCTCTAGGC 
CCCCAGGGAT 
ACCCTGCACT 
CTGCACAGTG 
TTATGTGAAA 
GTCGGGGGGG 
ACACGCCTGC 
AGTATTCCAG 
GCCAACTCCT 
TTCTGTCCTT 
AAG C ACT CAT 



AGCT CATCCT 3 60 

AGGATGAACC 42 0 

AACCCTTTGG 480 

TGCTCCTGGT 540 

GCCAGGGCAC 600 

TTGCCGTGGT 660 

ACATCTTCTT 72 0 

ACCTGACGCC 780 

GCGACCCCCA 840 

CCTGCGTGGC 900 

CCCTGCAGAG 960 

G C CG CAT CAT 1020 

TGGCCATTGG 1080 

ACGTGCAGGA 1140 

TGAACGTGCA 12 00 

CCCTGTACGC 12 60 

GCGGCAGCTT 1320 

GGGGAGTCGG 1380 

CCCACCACCG 1440 

ACCCACCCTA 1500 

GCACCCTCCT 1560 

GCCATGAGGG 162 0 

CTCAGGTTGC 1680 

CTTGCTTCTA 1740 

TGTCCTCACT 180 0 

CAGGCCCAGT 1860 

CATCAGCCCT 1920 

ACACGCGCAC 1980 

CCTCTCACAT 2 040 

CACCCACAGC 210 0 

TTAGTGGGAC 2160 

GTTGCTGGAA 2220 

CACATAGAAG 2280 

ATGTAAGACC 2 340 

ATGAGCTGCA 2400 

GCGATCAGCT 2460 

TAAAACGTTC 252 0 

AGCCCAGATA 2580 



Seq ID NO: 111 Protein sequence: 
Protein Accession #: NP 000686 



45 



50 



55 



60 



65 



70 



75 



80 



85 



MKDEPRSTNL 
I SQGTEKVLA 
KHLTPVTLEL 
PALQSTITRF 
VDVQETEPVM 
SSGSFGGNEG 
RYPPYTDWNQ 



11 
I 

FMKLDSVFIW 
EVLPQYLDQS 
GGKNPCYVDD 
YGDDPQSSPN 
QEEIFGPILP 
FTYISLLSVP 
QLLRWGMGSQ 



21 



KEPFGLVLI I 
CFAWLGGPQ 
NCDPQTVANR 
LGRI INQKQF 
IVNVQSVDEA 
FGGVGH SGMG 
SCTLL 



31 
I 

APWNYPLNLT 
ETGQLLEHKL 
VAWFCYFNAG 
QRIiRALLGCG 
IKFINRQEKP 
RYHGKFTFDT 



41 



LVLLVGTLPA 
DYIFFTGSPR 
QTCVAPDYVL 
RVAIGGQSNE 
LALYAFSNSR 
FSHHRTCLLA 



51 
I 

GNCWLKPSE 
VGKIVMTAAT 
CSPEMQERLL 
SDRYIAPTVL 
QWNQMLERT 
PSGLEKLKEI 



Seq ID NO: 112 DNA sequence 
Nucleic Acid Accession ft: NM_004456 
Coding sequence: 58-22 98 



11 



21 



GAATTCCGGG 
GGCCAGACTG 
GAGTACATGC 
TTT AGTT CCA 
CAGCGAAGGA 
GAGTGTTCGG 
AATGCAGTTG 
GTGGAAGATG 
GATGGT ACT T 
GAATGTGGGT 
AATGATGATG 
GATCTGGAGG 
AAAATTTTGG 
GAAAAATATA 
CCCAACATAG 
CATACGCTTT 
ACACCCAACA 
CCACAGTGTT 
CGGATAAAGA 
' AGTAGCAGGC 
AGGGAAGCAG 
GATGAAACTT 
CCAAATATTG 
GTCCTCATTG 
ACATGTAGAC 
GCTGAGGATG 
CACTGCAGAA 



CGACGCGCGG 
GGAAGAAATC 
GACTGAGACA 
AT CGTCAGAA 
TACAGCCTGT 
TGACCAGTGA 
CTT CAGTACC 
AAACTGTTTT 
TCATTGAAGA 
TTATAAATGA 
ACGATGATGA 
ATCACCGAGA 
AGGCCATTTC 
AAG AAC T CA C 
ATGGACCAAA 
TCTGTAGGCG 
CTTATAAGCG 
ACCAGCATTT 
CCCCACCAAA 
CCAGCACCCC 
GGACTGAAAC 
CGAGCTCCTC 
AACCTCCTGA 
GCACTTACTA 
AGGTGTATGA 
TGGATACTCC 
AGATACAGCT 



GAACAACGCG 
TGAGAAGGGA 
GCTCAAGAGG 
AATTTTGGAA 
GCACATCCTG 
CTTGGATTTT 
CATAATGTAT 
ACATAACATT 
ACTAATAAAA 
TGAAATTTTT 
TGATGGAGAC 
TGATAAAGAA 
CTCAATGTTT 
CGAACAGCAG 
TGCTAAATCT 
ATGTTTTAAA 
GAAGAACACA 
GGAGGGAGCA 
ACGTGCAGGA 
CACCATTAAT 
GGGGGGAGAG 
TGAAGCAAAT 
GAATGTGGAG 
TGACAATTTC 
GTTTAGAGTC 
TCCAAGGAAA 
GAAAAAGGAC 



31 

I 

AGTCGGCGCG 
CCAGTTTGTT 
TTCAGACGAG 
AGAACGGAAA 
ACTTCTGTGA 
CCAACACAAG 
TCTTGGTCTC 
CCTTATATGG 
AATTATGATG 
GTGGAGTTGG 
GATCCTGAAG 
AGCCGCCCAC 
CCAGATAAGG 
CTCCCAGGCG 
GTTCAGAGAG 
TATGACTGCT 
GAAACAGCTC 
AAGGAGTTTG 
GGCCGCAGAA 
GTGCTGGAAT 
AACAATGATA 
TCTCGGTGTC 
TGGAGTGGTG 
TGTGCCATTG 
AAAGAAT CTA 
AAGAAGAGGA 
GGCTCCTCTA 



41 
i 

CGGGACGAAG 
GGCGGAAGCG 
CTGATGAAGT 
TCTTAAACCA 
GCTCATTGCG 
TCATCCCATT 
CCCTACAGCA 
GAGATGAAGT 
GGAAAGTACA 
TGAATGCCCT 
AAAGAGAAGA 
CTCGGAAATT 
GCACAGCAGA 
CACTTCCTCC 
AGCAAAGCTT 
TCCTACATCC 
TAGACAACAA 
CTGCTGCTCT 
GAGGACGGCT 
CAAAGGATAC 
AAGAAGAAGA 
AAACACCAAT 
CTGAAGCCTC 
CTAGGTTAAT 
GCAT CATAGC 
AACACCGGTT 
ACCATGTTTA 



51 
I 

AATAATCATG 
TGTAAAATCA 
AAAGAGTATG 
AGAATGGAAA 
CGGGACTAGG 
AAAGACTCTG 
GAATTTTATG 
TTTAGATCAG 
CGGGGATAGA 
TGGTCAATAT 
AAAGCAGAAA 
TCCTTCTGAT 
AGAACTAAAG 
TGAATGTACC 
ACACTCCTTT 
TTTTCATGCA 
ACCTTGTGGA 
CACCGCTGAG 
TCCCAATAAC 
AGACAGTGAT 
AGAGAAGAAA 
AAAGATGAAG 
AATGTTTAGA 
TGGGACCAAA 
TCCAGCTCCC 
GTGGGCTGCA 
CAACTATCAA 



60 
12 0 
180 
240 
300 
360 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 



231 



10 



15 



WO 02/086443 

CCCTGTGATC ATCCACGGCA 
TTTTGTGAAA AGTTTTGTCA 
TGCAAAGCAC AGTGCAACAC 
CCTGACCTCT GTCTTACTTG 
AAGAACTGCA GTATTCAGCG 
GCAGGCTGGG GGATTTTTAT 
TGTGGAGAGA TTATTTCTCA 
ATGTGCAGCT TTCTGTTCAA 
AACAAAATTC GTTTTGCAAA 
GTTAACGGTG ATCACAGGAT 
CTGTTTGTTG ATTACAGATA 
GAAATGGAAA TCCCTTGACA 
CTTCAGGAAC CTCGAGTACT 
AATTTGCAAA GTACTGTAAG 
GCCTTCTCAC CAGCTGCAAA 
TACATTTTTC AACTTTGAAT 



PCT/US02/12476 



GCCTTGTGAC 
ATGTAGTTCA 
CAAGCAGTGC 
TGGAGCCGCT 
GGGCTCCAAA 
CAAAGATCCT 
AGATGAAGCT 
CTTGAACAAT 
TCATTCGGTA 
AGGTATTTTT 
CAGCCAGGCT 
TCTGCTACCT 
GTGGGCAATT 
AATAATTTAT 
GTGTTTTGTA 
AAAGAATACT 



AGTTCGTGCC 
GAGTGT CAAA 
CCGTGCTACC 
GACCATTGGG 
AAGCATCTAT 
GTGCAGAAAA 
GACAGAAGAG 
GATTTTGTGG 
AATCCAAACT 
GCCAAGAGAG 
GATGCCCTGA 
CCTCCCCCTC 
TAGAAAAAGA 
AGTAATGAGT 
CCAGTGAATT 
TGAACTTGAA 



CTTGTGTGAT 
ACCGCTTTCC 
TGGCTGTCCG 
ACAGTAAAAA 
TGCTGGCACC 
ATGAATTCAT 
GGAAAGTGTA 
TGGATGCAAC 
GCTATGCAAA 
CCATCCAGAC 
AGTATGTCGG 
CTCTGAAACA 
ACATGCAGTT 
TTAAAAATCA 
TTTGCAATAA 
AAAAAAAAAA 



AGCACAAAAT 1680 

GGGATGCCGC 1740 

AGAGTGTGAC 180 0 

TGTGTCCTGC 1860 

ATCTGACGTG 192 0 

CTCAGAATAC 1980 

TGATAAATAC 2 040 

CCGCAAGGGT 2100 

AGTTATGATG 2160 

TGGCGAAGAG 2220 

CATCGAAAGA 22 80 

GCTGCCTTAG 2340 

TGAAATTCTG 240 0 

ACTTTTTATT 2460 

TGCAGTATGG 2520 
AAAAAA 



Seq ID NO: 113 Protein sequence: 
20 Protein Accession #: NP 004447 



25 



30 



35 



MGQTGKKSEK 
KQRRIQPVHI 
MVEDETVLHN 
YNDDDDDDDG 
KEKYKELTEQ 
ATPNTYKRKN 
NSSRPSTPTI 
KPNIEPPENV 
PAEDVDTPPR 
NFCEKFCQCS 
CKNCSIQRGS 
YMCSFLFNLN 
ELFVDYRYSQ 



11 

I 

GPVCWRKRVK 
LTSVSSLRGT 
IPYMGDEVLD 
DDPEEREEKQ 
QLPGALPPEC 
TETALDNKPC 
NVLESKDTDS 
EWSGAEASMF 
KKKRKHRLWA 
SECQNRFPGC 
KKHLLLAPSD 
NDFWDATRK 
ADALKYVGIE 



21 
I 

SEYMRLRQLK 
RECSVTSDLD 
QDGTFIEELI 
KDLEDHRDDK 
TPNIDGPNAK 
GPQCYQHLEG 
DREAGTETGG 
RVLIGTYYDN 
AHCRKIQLKK 
RCKAQCNTKQ 
VAGWGIFIKD 
GNKIRFANHS 
REMEIP 



31 
I 

RFRRADEVKS 
FPTQVIPLKT 
KNYDGKVHGD 
ESRPPRKFPS 
SVQREQSLHS 
AKE FAAALTA 
ENNDKEEEEK 
FCAIARLIGT 
DGSSNHVYNY 
CPCYLAVREC 
PVQKNEFISE 
VNPNCYAKVM 



41 



MFSSNRQKIL 
LNAVASVPIM 
RECGFINDEI 
DKILEAISSM 
FHTLFCRRCF 
ERIKTPPKRP 
KDETSSSSEA 
KTCRQVYEFR 
QPCDHPRQPC 
DPDLCLTCGA 
YCGEIISQDE 
MVNGDHR I G I 



51 
I 

ERTEILNQEW 60 

YSWSPLQQNF 12 0 

FVELVNALGQ 180 

FPDKGTAEEL 240 

KYDCFLHPFH 300 

GGRRRGRLPN 360 

NSRCQTPIKM 42 0 

VKESSIIAPA 480 

DSSCPCVIAQ 540 

ADHWDSKNVS 600 

ADRRGKVYDK 660 

FAKRAIQTGE 720 



40 



45 



50 



55 



Seq ID NO: 114 DNA sequence 
Nucleic Acid Accession #: NM_001827 
Coding sequence: 96-335 



AGTCTCCGGC 
CGCTCTCGTT 
CGGACAAGTA 
CCAAACAAGT 
AACAGAGTCT 
TTAGACGAC C 
TTTTCAAATT 
ACAAATCTTT 
AAATGCAACT 
TTTCTCTTAA 
TAT GT TG CAT 



11 
I 

GAGTTGTTGC 
TCATTTTCTG 
CTTCGACGAA 
ACCTAAAACT 
AGGCTGGGTT 
TCTTCCAAAA 
TAATGTATAT 
CATCCATACC 
GCAAGTAGGT 
GTGCCTGTTT 
TTAAAAAAAA 



21 
I 

CTGGGCTGGA 
CAGCGCGCCA 
CACTACGAGT 
CATCTGATGT 
CAT TACATGA 
GATCAACAAA 
GTGTATATAA 
TGTGCATGAG 
TACTGTAAGA 
GAGTTTACTG 
AAAAAAA 



31 
I 

CGTGGTT TTG 
CGAGGATGGC 
ACCGGCATGT 
CTGAAGAGGA 
TTCATGAGCC 
AATGAAGTTT 
GGTAGTATTC 
CTGTATTCTT 
TGTTTAAGAT 
AAACAGTTTA 



41 
I 

TCTGCTGCGC 
CCACAAGCAG 
TATGTTACCC 
GTGGAGGAGA 
AGAACCACAT 
ATCTGGGGAT 
AGTGAATACT 
CACAGCAACA 
AAAAGTTCTT 
CTTTTGTTCA 



51 
I 

CCGCTCTTCG 60 

ATCTACTACT 12 0 

AGAGAACTTT 180 

CTTGGTGTCC 240 

ATTCTTCTCT 300 

CGTCAAATCT 360 

TGAGAAATGT 420 

GAGCTCAGTT 480 

CCAGTCAGTT 540 

ATAAAGTTTG 600 



Seq ID NO: 115 Protein sequence: 
Protein Accession #: NP 001818 



1 11 21 31 41 51 

60 | i | | I I 

MAHKQIYYSD KYFDEHYEYR HVMLPRELSK QVPKTHLMSE EEWRRLGVQQ SLGWVHYMIH 
EPEPHILLFR RPLPKDQQK 



60 



Seq ID NO: 116 DNA sequence 
65 Nucleic Acid Accession #: CAT cluster 



70 



75 



80 



85 



TCAGACCTCA 
GCATCTGGAC 
AGAGGTGTGT 
GCAGCCAACA 
AAGG AC TG AT 
CCTTGGAAGG 
TCAAGAATTC 
AGTGTGG GAG 
CCCATCTCTA 
CCTGTAGTTC 
AGGCTGCAAT 
CCTGTCTCAA 
TTTGAGGTGC 
CCTGAAGGAG 
GACAGACCTT 
CTCTTCCCCC 
CCGCCTCCCA 
CAGCCGGATA 
TCCTGCTCCG 



11 

1 

TGAGTCACTT 
CCTTGGTGCT 
TCCAGGGAAA 
GAGTTCAAAA 
CCACATTCCC 
ACCTGGCTCA 
TTTGCTGAGC 
GATCTCTTGA 
AAATAATAAT 
CAGCTACCCA 
GAACTGTGAT 
ATAATAATAA 
CATTTGGGTA 
CAGAGGGATG 
GTCCTTCTTC 
TCCCTGTCCC 
TGTCTGCTGT 
CAGAGTGAAT 
TGTAAAGAGG 



21 



GGACTCTTGA 
ATCGACGAAG 
GCCCCTATCT 
TGCAGGCTTG 
ACCAGGAAGT 
GGCTGGACCA 
ATGGTGCCTC 
GCCCAGGAGT 
AATAATAAAA 
GGAGGCTGAG 
TACCCCACTG 
TAATAATAAT 
GAAAGAAAAG 
CATCGCTGGA 
CTTGTGGAAA 
AGGGAACCAA 
GCCTTTGTAC 
AGTTAACCAC 
CCAGTGTTTG 



31 
I 

GCCACCTCTG 
CTTGGGTGGG 
CT CTGCAGAG 
GAAAGTACAG 
TTAGCAGAAC 
CCTCTTGAGA 
ATGCCTATAA 
TCAAGACTAG 
TAAAAAATTA 
GCAAGAGGAT 
CACTCCAGCC 
CTTATTTTGG 
ACGTTTACAC 
GGTGACCTAC 
GTGTTTCCTC 
AGGGCTTTCT 
TCAGCAATTC 
ACTTAGGTCA 
TGTGTTGCAA 



41 



GGGGTGGAGT 
GCTCTTAGCT 
GTCAAGTGAA 
GGGGCTCTGT 
CCCCGCGTGC 
GGGAGGAGCT 
TACCAACACT 
CCTGGGCAAC 
GCAGGGCATG 
GGCTGGAGCC 
TGGGCAAAAG 
AGAATAAAGA 
CGAGAAATAG 
AGTTGAAGAA 
TGCTGCTACT 
ACCACACCCT 
TTGTTTGCTC 
AATAGGATCT 
GCAGCCTTGG 



51 
I 

CTCTCTCCTG 60 

GCTATGTGCA 120 

AGCGACGGCC 180 

GGAGGATGGG 240 

CAACTGGACC 300 

CTGGATTTGA 360 

TTGGGAGGCC 420 

ACAGAGAGAA 480 

GTGGCATGTG 540 

TGGGATGTTG 600 

AGCGAGAGAA 660 

GACCTCTGGA 720 

TCTGTGTTGC 780 

GACTCATTAT 840 

GCTCATGAGA 900 

TTCTTGCCCC 960 

CATTATCTTC 1020 

AAATTTTTGT 10 80 

AATAGTAACT 1140 



232 



10 



WO 02/086443 

CTTCTCATTT GTTTGGGATC 
AGTTCATCAG GCTCTCGGAC 
GTGAAGGCTC GTGTTCTCCA 
TTGGAAGGGC AAAAAATGAA 
ACAGTCTGCT GTGAAGACCT 
GCTTCATGAG AGACTGACAG 
CAGTGTGTGC TGATGACACA 
ACTCTGTAGC CAACATACAC 
CTTGTCCAAA TGCAGAGTCA 
TGGCTTTCTT TTTGCAAAAA 
AAACAAAAAA 



TGGCCACCAA 
CTTAGGGCTG 
TCCTCAACTT 
CACTGTCGTT 
TCT CTCAAGT 
CTATCAGGGG 
TACACACCTG 
ATGATTTAAA 
GAGCTATTTG 
TAATTAAAGT 



GTTCCAGAAT 
TTGGAGAAGG 
TCTTTGCTTC 
CATTGCAGCC 
GGCATTTGGG 
TTGTGGCACT 
ACAATAGCTT 
ACCCTTTCTA 
TACTTCATTA 
TTTTGTATGT 



GATACACGGA 
CTTCAGCAGC 
GATCATACAC 
GTGTTTTGTG 
AGTCCATGCC 
TAGTGAGGAC 
GAGTCTTCTC 
AATATCTATC 
TTATTTCCAA 
TGCAAAAAAA 



TCAGTGCAGA 1200 

AGAACTGATG 12 60 

AAGAATACAT 1320 

ACACAGATGC 1380 

AGATCATGGT 1440 

TCTCCTCCCC 150 0 

TGTTCCTTTT 1560 

ATGGTTCATC 162 0 

GGCGAATAGT 1680 

AAAAAAAAAA 1740 



PCT/US02/12476 



15 



Seq ID NO: 117 DNA sequence 

Nucleic Acid Accession #: BC012178.1 

Coding sequence: 204-2285 



20 



25 



30 



35 



40 



45 



50 



55 



CTTCTCTCCC 
TGGCGGCTGG 
GCCCGCGGCG 
CCGCGGCTCC 
CTGGAGGAGA 
CTGGTGCTCA 
AAATTTT CCC 
TCATCTCTGG 
TATTCACTAT 
TATTTGGAGG 
TGGATAATAC 
ATGGAGATAG 
TAGTAGCAGG 
TTGGCCTTAC 
GCAGTGGAAC 
GAGTAGGCAC 
CAGCTTTGCT 
GCTTTATGAG 
AGGT CAAAGT 
CAGATGAAGA 
CTGAAGAGAA 
GAGAAATGAA 
TAATTGAAAG 
ATGACACAGA 
ATTTTCATAA 
TTTCCAGGCA 
C T TAT AT T TG 
CTGCAAGTGT 
AGG AT CAGG A 
CAATTAAAAC 
CCAGTAAAGA 
TGTGTCACAA 
CAGATGTTAC 
TTGAGGCCCA 
TGATTTTGAC 
GAT CTGTGGT 
CTGGCAATGA 
CTGGTATTTC 
AGTAATAAAC 



11 

I 

GCGGCGCTGG 
CTCCTCTCCG 
CCGACCCTTC 
GGCCCTGGCC 
CCTTAAGGAT 
GTACGGGAAA 
CTTGGAAACA 
AGGACCTAAT 
TGGCAAGCCT 
TACTGTGCAC 
ATGTTCATTA 
TGTAGACAAA 
CATAGCAAAT 
AGAAAATGGA 
CTTCACCGTG 
GTCAAAAGTT 
AAATCGTGCT 
AAAACGAGAA 
GATAAATGCT 
TAGAACCCCA 
AAGAAAAATC 
CTTGAAACCA 
TGCATCCCTT 
GCTCATCAGA 
AGATGAAGTG 
TCCATTTCGA 
TAAGGACTTT 
TAAAAAGCCA 
GAAGCTGATG 
TGTAGGTGTG 
TGAACCTGAC 
CGTTAACAGA 
TCCCACTTTC 
TAACATTCTC 
ACCATTACAT 
TATTCGAACC 
GAT CCCTGTA 
TCGAATTATG 
TTCTTGTTCT 



21 
I 

GGCCCGCGCT 
CTGCCGGCTG 
CGGCACCCTC 
CCGATGGCTC 
GGCCACCACC 
GT CAT AGACC 
CCAGCATTTG 
TCTGTGTATG 
GTTCTTGGAA 
AAAAAAAGTG 
TTCAGGGGCC 
GTAGCTGATG 
GAATCTAAAA 
AAAGTAATAC 
CAGAACAGAG 
TTGGTTTTAC 
TTGAACCAAG 
AGCCAGTCTG 
GCTCATTCTT 
CGGAAAAGAA 
ATTGGGGATA 
GAGGAGGTTT 
GT TGCAAGTG 
AAGTTGAGAG 
AGAATTTTGG 
GGTCCTGGCC 
CCTGAAACCA 
CATACCCTAT 
CAAATTACCA 
CAGGGTGACT 
TGGGAATCAC 
GTTGTTTATA 
TTGACAACAG 
AGGGAGTCTG 
TTTGATCGGG 
TTTATTACTA 
GAGGTGGTAT 
TATGACTTAA 
ATTAAAA 



31 



CCGCTGCTGT 
CTCCTCGACC 
CCGCCCCGTC 
TGTGCAACGG 
ACTATGAAGG 
GAAGAGTGAG 
CTATAAAGGA 
CTGAAGATGC 
TTTGCTATGG 
TCAGAGAAGA 
TTCAGAAGGA 
GATTCAAGGT 
AGTTATATGG 
TGAAGAATTT 
AACTTGAGTG 
TCAGTGGTGG 
AACAAGTCAT 
TTGAAGAGGC 
TCTACAATGG 
TTAGCAAAAC 
CTTTTGTTAA 
TCCTTGCCCA 
GCAAAGCTGA 
AGGAGGGAAA 
GCAGAGAACT 
TGGCAATCAG 
ACAATATTTT 
TACAGAGAGT 
GTCTGCATTC 
GTCGTTCCTA 
TTATTTTTCT 
TATTTGGCCC 
GGGTGCTCAG 
GGTATGCTGG 
ACCCACTTCA 
GTGACTT CAT 
TAAAGATGGT 
CATCAAAGCC 



41 
I 

TGCTCCATTC 
AGGCCTCCTT 
TCGTACTGTC 
AGACT CCAAG 
AGCTGTTGTC 
GGAACTGTTC 
ACAAGGATTC 
TCCCTGGTTT 
TATGCAGATG 
TGGAGTTTTC 
AGAAGTTGTT 
TGTGGCACGT 
AGCACAGTTC 
CCTTTATGAT 
TATTCGAGAG 
AGTAGACTCA 
TGCTGTGCAC 
CCTCAAAAAG 
AACAACAACC 
GTTAAATATG 
GATTGCCAAT 
AGGTACTTTA 
ACTCATCAAA 
AGTAATAGAA 
TGGACTTCCA 
AGTAATATGT 
GAAAATAGTA 
CAAAGCCTGC 
ACTGAATGCC 
CAGTTACGTG 
GGCTAGGCTT 
ACCAGTTAAA 
TACTTTACGC 
GAAAATCAGC 
AAAGCAGCCT 
GACTGGTATA 
CACTGAGATT 
CCCAGGAACT 



51 
I 

GGCGCTTTTC 60 

CTCAACCTCA 12 0 

GCCGTCACCG 18 0 

CTGGAGAATG 240 

ATTCTGGATG 3 00 

GTGCAGTCTG 3 60 

CGTGCTATTA 42 0 

GAT CCAGCAA 480 

ATGAATAAGG 540 

AACATTAGTG 600 

TTGCTTACAC 660 

TCTGGAAACA 720 

CACCCTGAAG 780 

ATAGCTGGAT 840 

ATCAAAGAGA 900 

ACAGTTTGTA 960 

ATTGATAATG 1020 

CTTGGAATTC 10 80 

CTACCAATAT 1140 

ACCACAAGTC 1200 

GAAGTAATTG 12 60 

CGGCCTGATC 1320 

ACCCATCACA 13 80 

CCTCTGAAAG 1440 

GAAGAGTTAG 15 00 

GCTGAAGAAC 1560 

GCTGATTTTT 162 0 

ACAACAGAAG 1680 

TTCTTGCTGC 174 0 

TGTGGAATCT 18 00 

ATACCTCGCA 18 60 

GAACCTCCTA 192 0 

CAAGCTGATT 1980 

CAGATGCCGG 2 040 

TCATGCCAGA 2100 

CCTGCAACAC 2160 

AAGAAGATTC 222 0 

ACTGAGTGGG 22 8 0 



60 Seq ID NO: 118 Protein sequence: 
Protein Accession #: AAH12178.1 



65 



70 



75 



MALCNGDSKIi 
APAIKEQGFR 
KSVREDGVFN 
SKKLYGAQFH 
VLLSGGVDST 
HSFYNGTTTL 
EVFLAQGTLR 
ILGRELGLPE 
TLLQRVKACT 
ESLIFLARLI 
ESGYAGKISQ 
WIiKMVTEIK 



11 
I 

ENAGGDLKDG 
AIIISGGPNS 
ISVDNTCSLF 
PEVGLTENGK 
VCTALLNRAL 
PISDEDRTPR 
PDLIESASLV 
ELVSRHPFPG 
TEEDQEKLMQ 
PRMCHNVNRV 
MPVILTPLHF 
KIPGISRIMY 



21 



HHH YEGAW I 
VYAEDAPWFD 
RGLQKEEWL 
VILKNFLYDI 
NQEQVIAVHI 
KRISKTLNMT 
ASGKAELIKT 
PGLAIRVICA 
ITSLHSLNAF 
VYIFGPPVKE 
DRDPLQKQPS 
DLTSKPPGTT 



31 
I 

LDAGAQYGKV 
PAIFTIGKPV 
LTHGDSVDKV 
AGCSGTFTVQ 
DNGFMRKRES 
TSPEEKRKI I 
HHNDTELIRK 
EEPYICKDFP 
LLP I KTVGVQ 
PPTDVTPTFL 
CQRSWIRTF 
EWE 



41 
I 

IDRRVRELFV 
LGI CYGMQMM 
ADGFKWARS 
NRELECIREI 
QSVEEALKKL 
GDTFVKIANE 
LREEGKVIEP 
ETNNILKIVA 
GDCRSYSYVC 
TTGVLSTLRQ 
ITSDFMTGIP 



51 
I 

QSEIFPLETP 60 

NKVFGGTVHK 120 

GNIVAGIANE 180 

KERVGTSKVL 240 

GIQVKVINAA 3 00 

V I GEMNLKPE 3 60 

LKDFHKDEVR 42 0 

DFSASVKKPH 48 0 

GISSKDEPDW 540 

ADFEAHNILrR 600 

ATPGNEIPVE 660 



Seq ID NO: 119 DNA sequence 
Nucleic Acid Accession #: NM_006500.1 
oO Coding sequence: 27.. 1967 

1 ll 21 31 41 51 

l l l l I I 

ACTTGCGTCT CGCCCTCCGG CCAAGCATGG GGCTTCCCAG GCTGGTCTGC GCCTTCTTGC 60 

85 TCGCCGCCTG CTGCTGCTGT CCTCGCGTCG CGGGTGTGCC CGGAGAGGCT GAGCAG CCTG 120 

CGCCTGAGCT GGTGGAGGTG GAAGTGGGCA GCACAGCCCT TCTGAAGTGC GGCCTCTCCC 180 

AGTCCCAAGG CAACCTCAGC CATGTCGACT GGTTTTCTGT C CACAAGG AG AAGCGGACGC 240 



233 



WO 02/086443 

TCATCTTCCG TGTGCGCCAG 
TCAGCCTCCA GGACAGAGGG 
GCATCTTCTT GTGCCAGGGC 
TCTACAAAGC TCCGGAGGAG 
5 GTAAGGAGCC TGAGGAGGTC 

TCATCTGGTA CAAGAATGGC 
CGTCCCAGAC TGTGGAGTCG 
TGGTTAAAGA AGACAAAGAT 
GGAACCACAT GAAGGAGTCC 

10 TGTGGCTGGA AGTGGAGCCC 

GTTTGGCTGA TGGCAACCCT 
GGGAGGCAGA GGAAGAGACA 
AGGAACACAG TGGGCGCTAT 
TGAGTGAACC ACAGGAACTA 

15 CCCCTGAGAG ACAGGAAGGC 

ACCTCGAGTT CCAGTGGCTG 
TTCAGTTGCA TGACCTGAAA 
CCAGCATACC CGGCCTGAAC 
GGATGGCATT CAAGGAGAGG 

20 GTGAAGCGTC AGGGCACCCC 

AACAAGACCA AGAT CCACAG 
TGTTGGAGAC AGGTGTTGAA 
TCTTCCTGGA GCTGGTCAAT 
TCAGCACTTC CACTGCCAGT 

25 TGCCGGAGCC GGAGAGCCGG 

TGGCGGTGCT GGGCGCTGTC 
GCTCAGGGAA GCAGGAGATC 
TTAAGTCAGA TAAGCTCCCA 
GGGCTCCGGG AGACCAGGGA 

30 CAGCTCCCTT CCCTGCCTGG 

CCTCCAAAGG GACTAGAGAG 
GGCCACTGGG TTAGGACCTG 
GTCCACCACC ATCTCCTCCA 
CCGAGCGGGT AGGAGAGTTT 

35 AAATACCTGG CTCCTGCCAG 

CAAAGGCTGG CTTCCACCAT 
GCCTGCTCAT GTTGAAGTGC 
AGAAGCAGCT GCAGTGTTGC 
ACATTTTTTC TTTGGTCAGA 

40 GGCCAGGTGT GGTGGCTCAC 

TCACAAAGTC AGGACGAGAC 
TACAAAAAAA AAT TAGCTAG 
CTGAAGCAGG AGAATGGTAT 
CACTGCACTC CAGCCTGGGC 

45 ACGCGTACCT GCGGTGAGGA 

TCCCCGTGTT CACTTGCTCC 
GGGGAGCAGA CAAAGATGAG 
T TAG CACCAA ACTTCTACAA 
AGAATGGTAC TTAGGGATGG 

50 CTGTGTGTAT GCATACATAT 

TTGTTTCCTT TATATATGTA 
AAAGCTTAAT TGT CCCAGAA 
AACCTGGGGG CCTGTGAAAC 
AGAGATCAGG GGTTACCTCT 

55 CTACCCTACT TTTCAGCAGC 

TGT TAG CAGG AGCTATGTCC 



PCT/US02/12476 



GGCCAGGGCC 
GCTACTCTGG 
AAGCGCCCTC 
CCAAACATCC 
GCTACCTGTG 
CGGCCTCTGA 
AGTGGTTTGT 
GCCCAGTTTT 
AGGGAAGTCA 
GTGGGAATGC 
CCACCACACT 
ACCAACGACA 
GAATGTCAGG 
CTGGTGAACT 
AGCAGCCTCA 
AGAGAAGAGA 
CGGGAGGCAG 
CGCACACAGC 
AAGGTGTGGG 
CGGCCCACCA 
CGAGTCCTGA 
TGCACGGCCT 
TTAACCACCC 
CCTCATACCA 
GGCGTGGTCA 
CTCTATTTCC 
ACGCTGCCCC 
GAAGAGATGG 
GAGAAATACA 
ACCATTCCCA 
AAGCCTCCTG 
AGGACCTCAC 
CGTTGAGTGA 
CTTGCAGAAC 
CAGCTGAGCT 
CCAGGTGCAC 
GCTGTTCACA 
TGCCACCACC 
AGCCAGGAAC 
GCCTGTAATC 
CATCCTGGCT 
GCGTAGTGGT 
GAAT CCAGGA 
AACACAGCGA 
AGCTGGGCGC 
CATAGCCCTC 
GTCTACACTG 
ACCAAGCTCA 
AAAACGGGGC 
GTGTGTATAT 
TGTATATATA 
AAT CATACAT 
TACAACCAAA 
GCTTCTGAGC 
AAAACGTCCC 
CTTCCTATCG 



AGAGCGAACC 
CCCTGACTCA 
GGT CCCAGGA 
AGGTCAACCC 
TAGGGAGGAA 
AGGAGGAGAA 
ACACCTTGCA 
ACTGTGAGCT 
CCGTCCCTGT 
TGAAGGAAGG 
T CAG CATCAG 
ACGGGGTCCT 
CCTGGAACTT 
ATGTGTCTGA 
CCCTGACCTG 
CAGACCAGGT 
GAGGCGGCTA 
TGGTCAAGCT 
TGAAAGAGAA 
TCTCCTGGAA 
GCACCCTGAA 
CCAACGACCT 
TCACACCAGA 
GAGCCAACAG 
TCGTGGCTGT 
TCTATAAGAA 
CGTCTCGTAA 
GCCTCCTGCA 
TCGATCTGAG 
GCTCCCTGCT 
CTCCCCTCAC 
TTGGCCCTGC 
AGCTCATCCC 
GTGTTTTTTC 
GGGTAGCCTC 
CACTGAAGTG 
CCCGCTCCGG 
CTCCTGCTCG 
TGGTGTCATT 
CCAGCACTTT 
AACACGGTGA 
TGGCACCTAT 
GGTGGAGCTT 
GACTCCGTCT 
TGTTTTCGAG 
TTGATGGATC 
TCCTTCATGG 
GGGCCCCAAC 
CTGGCTAGAG 
ATGGTTT TGT 
TATATGAAAA 
TGCTTTTTTA 
AGGCACACAA 
AAATGGCTCA 
GTATGACGCA 
TTTCCGTCCA 



TGGGGAGTAC 


GAGCAGCGGC 


300 


AGTCACCCCC 


CAAGACGAGC 


360 


GTACCGCATC 


CAGCTCCGCG 


420 


CCTGGGCATC 


CCTGTGAACA 


480 


CGGGTACCCC 


ATTCCTCAAG 


540 


GAACCGGGTC 


CACATT CAGT 


600 


G AGT AT T CTG 


AAGGCACAGC 


660 


CAACTACCGG 


CTGCCCAGTG 


720 


TTTCTACCCG 


ACAGAAAAAG 


780 


GGACCGCGTG 


GAAAT CAGGT 


840 


CAAGCAGAAC 


CCCAGCACCA 


900 


GGTGCTGGAG 


CCTGCCCGGA 


960 


GGACACCATG 


ATATCGCTGC 


1020 


CGTCCGAGTG 


AGTCCCGCAG 


1080 


TGAGGCAGAG 


AGTAGCCAGG 


1140 


GCTGGAAAGG 


GGGCCTGTGC 


1200 


TGGCTGCGTG 


GCGTCTGTGC 


1260 


nnrrATTTTT 

Ww^v**l X X X X 


GGCCCCCCTT 


1320 


T A Tf^ ftTfi T TCt- 


AAT CTGT C T T 

*TLJtX X X w X »■ X X 


1380 


CGTGAACGGC 


ACGGCAAGTG 


1440 


X W X *w X X v_j 


ACCCCGGAGC 


1500 


GGGCAAAAAC 


ACCAGCAT CC 


1560 


CT CGAACACA 


ACCACTGGCC 


1620 


GACCTCCACA 


GAGAGAAAGC 


1680 


GATTGTGTGC 


ATCCTGGTCC 


1740 . 


GGGCAAGCTG 


CCGTGCAGGC 


1800 


GACCGAACTT 


GTAGTTGAAG 


1860 


GGGCAGCAGC 


GGTGACAAGA 


1920 


GCATTAGCCC 


CGAATCACTT 


1980 


CACTCTTCTC 


TCAGCCAAAG 


2040 


CTdClACACCC 


CCTTTCAGAG 


2100 


AAGCCGCTTT 


TCAGGGACCA 


2160 


AAGCAAGGAG 

AriW VJVJ^l VJ 


CCCCAGTCTC 


2220 


TTTACACACA 


TTATGGCTGT 


2280 


TCTGAGCTGG 


TTTCCTGCCC 


2340 


AGGACACACC 


GGAGCCAGGC 

\j\Jfl^J ^a-i*\J W 


2400 


AGAGCACCCC 


AGCGGCATCC 


2460 


CCTGTTCAAA 


GTCTCCTGTG 

Va^ X A ^a# V at A 


2520 


CCTTAAAAGA 


TACGTGCCGG 


2580 


GGGAGGCCGA 


GGCGGGCGGA 

^■1 ^^a>^a»^a1 ^a< ^p#aV * 


2640 


AACCCTGTCT 

A a* A Va» afc X A 


CTACTAAAAA 

*aj* afc a\ aV ^ * *a* aVaV aa aa aV 


2700 


AGTCCCAGCT 


ACTCGGAAGG 


2760 


GCAGTGAGCC 


GAGACCGTGC 


2820 


CGAGGAAAAA 


AAAAGAAAAG 

av la * * » * aa^a*a\ aa ■ a a a aa^af 


2880 


TTGAGGTGAA 


TTAGCCTCAA 


2 940 


AGGTAAAACT 


GAAAGGCAGC 


3000 

^a* W W V 


GGATTAAAGC 


TATGGTTATA 

X aVal X 'a-J ^ aL aVaV aaa il a. 


3060 


CGTAGAAGGG 


CCCAAATGAG 


3120 

_j -a- *j <y 


CTTGGGGTGT 


GTGTGTCTGT 


3180 




ZV ZV T T TG P A A ZV 


1240 


TATATATATA 


TATGAAAAAT 


3300 


TTCTACATGG 


GTACCACAGG 


3360 


AACCGTTTCC 


AGTTGGCAGC 


3420 


AGCTCTACCA 


GAGCAGACAG 


3480 


GCACGAAGGG 


CCTGGCAGGC 


3540 


CTT 







Seq ID NO: 120 Protein sequence: 
60 Protein Accession #: NP 006491.1 



65 



70 



75 



MGLPRLVCAF 
DWFSVHKEKR 
PRSQEYRIQL 
LKEEKNRVHI 
VTVPVFYPTE 
DNGVLVLEPA 
LTLTCEAESS 
QLVKLAIFGP 
LSTLNVLVTP 
TRANSTSTER 
PPSRKTELW 



11 
I 

LLAACCCCPR 
TLIFRVRQGQ 
RVYKAPEEPN 
QSSQTVESSG 
KVWLEVEPVG 
RKEHSGRYEC 
QDLEFQWLRE 
PWMAFKERKV 
ELLETGVECT 
KLPEPESRGV 
EVKSDKLPEE 



21 
I 

VAGVPGEAEQ 
GQSEPGEYEQ 
IQVNPLGIPV 
LYTLQSILKA 
MLKEGDRVE I 
QAWNLDTMIS 
ETDQVLERGP 
WVKENMVLNL 
ASNDLGKNTS 
VIVAVIVCIL 
MGLLQGSSGD 



31 

I 

PAPELVEVEV 
RLSLQDRGAT 
NSKEPEEVAT 
QLVKEDKDAQ 
RCLADGNPPP 
LLSEPQELLV 
VLQLHDLKRE 
SCEASGHPRP 
ILFLELVNLT 
VLAVLGAVLY 
KRAPGDQGEK 



41 


51 




1 

GSTALLKCGL 


1 

SQSQGNLSHV 


60 


LALTQVTPQD 


ERIFLCQGKR 


120 


CVGRNGYPIP 


QVIWYKNGRP 


180 


FYCELNYRLP 


SGNHMKESRE 


240 


HFSISKQNPS 


TREAEEETTN 


300 


NYVSDVRVSP 


AAPERQEGSS 


360 


AGGGYRCVAS 


VPSIPGLNRT 


420 


T I SWNVNGTA 


SEQDQDPQRV 


480 


TLTPDSNTTT 


GLSTSTASPH 


540 


FIiYKKGKLPC 


RRSGKQEITL 


600 


YIDLRH 







80 



85 



Seq ID MO: 121 DNA sequence 
Nucleic Acid Accession #: NM_018306 
Coding sequence: 60-671 



ATAGTCTACA 
TGGAGACTTC 
AAGATGTAGA 
CCCAAGAACA 
CCTCATCTTC 



11 

I 

CAGAGCTCCC 
AGCATCCTCC 
CTATGGAGAG 
ATATGAGAGA 
TTCATCCTCC 



21 
I 

CTTGCTGCCC 
TCCCAGCCTC 
ACAGATTTCC 
AACAAGTCTT 
TCCTCCTCAG 



31 



AGACAAGCTG 
AGGACAACAG 
ACAAGCAAGA 
CTTCCTCCTC 
GTCCTGGGCA 



41 

1 

AAGGACCACA 
TCAAGTCCAC 
CGGGAAGGCT 
CTTCTCTTCC 
TGGGGAGCCT 



51 

I 

GGAAAAGCCA 60 

AGAGAAACAG 12 0 

GGACTCTTTT 180 

TCCTCATCCT 240 

GACGTTTTGA 3 00 



234 



10 



15 



20 



WO 02/086443 

AGGATGAGCT TCAACTCTAT 
GACTCCGAAG GAGAGG CTCT 
GACTGAATAT AAAGAAAGAT 
GGGCCTTGCT GGTGTGTTAT 
TGCTCACCTT CGCCTCCCTG 
ACAGCGTCCT CCAAGGCTTC 
AGACTGACTG AGGCCACTTC 
GCGACCCCTG AGCCCACAAG 
AGACCAATAA ACAGAACACT 
AGGGGCATCT CATTTGGGCA 
GGTGGGTGTG GGGCCTGAGG 
ACTGCTCTCA GAGGACAGCA 
ATGGTTTTTC TCAAATCCCA 
GGGAGAGATG GATGGTCCAC 
GAACCTGATG CAGGTAAGAT 
GGCAGGAAAA TGATCAT CAG 
TCCTCGCACT TTGGGAGGCT 
CTGGGCAACA TAGTGAGACC 
TACATACCTG TACATACCTG 
TGAGCCCAGG AGTTCAGGGC 
CGACAGAGCA AGATCGTTTC 



GGAGATGCTC 
GACCCAGCAA 
GATGAGT TTT 
CACTATTACG 
GAAACCGTTG 
ATCCCCCTCT 
CAGGTGGGCA 
GGCAGAGCAG 
TTTCCTTCCA 
GTACTGCTGT 
CTTCACAGTA 
AGGGACCCTG 
GGCTATCTGC 
TGCTTTGAGG 
GCTGAGGACT 
AAACTAAATG 
CAGGCTAAGG 
CCCATCTCTA 
CGGTTCCAGC 
TGCAGTGAGG 
TCTAAAATT 



CTGGAGAGGT 
GTGGAGAAGT 
TCCATTTCGT 
CAGACTGGTT 
GCATCTACTT 
TCCAGAAGTT 
GCAGAGGCAG 
CATTCTGAGA 
TGTGGTCTGA 
GCAACCCAGC 
CCTGGACCAG 
AGCT CTGCAA 
ATGCGCTCTC 
CAGGGAGCCA 
AAAACCATTT 
GCAGCCAGGC 
GTCGCTTGAA 
CAATTTTTTT 
TACTCAAGAG 
TACGATCAAG 



GGTACCCTCT 
GGAGGCCTCT 
CCTCCTGTGC 
CATGTCTCTT 
CGGACTAGTG 
TAGGCTGACA 
GCCCCAGTGT 
GACGCACAGG 
ATGTTGGCAC 
TGCAAGGATG 
CAGGAAGATT 
GCTGTGATCT 
AGGTGCTACC 
TCGGGCTGGG 
TTTTTGCACC 
ATGGGGGCTC 
GCTGAGAGTT 
TTAATGACCA 
GCTGAGGCAG 
CCACTGCACT 



GGGGAATCAG 3 60 

CAGTTAAGAA 420 

TTTGCCATCG 480 

GGGGTCGGCC 540 

TACCGTAT CC 60 0 

GGGTTCAGGA 660 

GACCACCACT 72 0 

AGACCAAGCC 780 

CAGCCCGGGC 840 

GAAGGCAGAG 90 0 

CTGGGAGGTC 960 

GTCTGGGTTC 1020 

GAGCCATCCT 10 80 

GCCCCTTGGT 1140 

CAAAAAAAAA 12 0 0 

ACGACTGTAA 12 60 

CAAGACCAAC 1320 

AATGTGGCGG 13 80 

GAGGACTGCT 1440 

CCAGCCTGGG 150 0 



PCT/US02/12476 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



Seq ID NO: 122 Protein sequence: 
Protein Accession ft: NP__060776 

1 11 21 31 41 51 

I l I l l l 

METSASSSQP QDNSQVHRET EDVDYGETDF HKQDGKAGLF SQEQYERNKS SSSSFSSSSS 
SSSSSSSSSS GPGHGEPDVL KDELQLYGDA PGEWPSGES GLRRRGSDPA SGEVEASQLR 
RLNIKKDDEF FHFVLLCFAI GALLVCYHYY ADWFMSLGVG LLTFASLETV GIYFGLVYRI 
HSVLQGFIPL FQKFRLTGFR KTD 

Seq ID NO: 123 DNA sequence 
Nucleic Acid Accession #: BC022542 
Coding sequence: 243.. 896 



11 



21 



31 



41 



51 



I 

ACTTGGTCCC AGCCGATAAA TCTGGGGCAG CGCGCGGTAG GAGCTGCGGG CGGCCAGGCC 
CCTTCCTGCG TCCGCACCTG GCCCCGCGCG CCCCTCTCGG GCGTCCGGCT TCCGGCGTCC 
TGGCGGCTCG GGTGGCGGCG GTTCGGGCGG CCGCCTGGCT GCTCCTCGGG GCGGCGACGG 
GGCT CACGCG CGGGCCCGCC ACGGCCTTCA CCGCCGCGCG CTCTGACGCC GGCATAAGGG 
CCATGTGTTC TGAAATTATT TTGAGGCAAG AAGTTTTGAA AGATGGTTTC CACAGAGACC 
TTTTAATCAA AGTGAAGTTT GGGGAAAGCA TTGAGGACTT GCACACGTGC CGTCTCTTAA 
TTAAACAGGA CATTCCTGCA GGACTTTATG TGGATCCGTA TGAGTTGGCT TCATTACGAG 
AGAGAAACAT AACAGAGGCA GTGATGGTTT CAGAAAATT T TGATATAGAG GCCCCTAACT 
ATTTGTCCAA GGAGT CTGAA GTTCTCATTT ATGCCAGACG AGATTCACAG TGCATTGACT 
GTTTTCAAGC CTTTTTGCCT GTGCACTGCC GCTATCATCG GCCGCACAGT GAAGATGGAG 
AAGCCT CGAT TGTGGT CAAT AACCCAGATT TGTTGATGTT TTGTGACCAA GAGTTCCCGA 
TTTTGAAATG CTGGGCTCAC TCAGAAGTGG CAGCCCCTTG TGCTTTGGAT AATGAGGATA 
TATGCCAATG GAACAAGATG AAGTATAAAT CAGTATATAA GAATGTGATT CTACAAGTTC 
CAGTGGGACT GACTGTACAT ACCTCTCTAG TATGTTCTGT GACTCTGCTC ATTACAATCC 
TGTGCTCTAC ATTGATCCTT GTAGCAGTTT TCAAATATGG CCATTTTTCC CTATAAGTTT 
TATGTAGTTA AATGCTTCCT AGAAACCTAA ATAAGATCTA TTAATTT CTG ACGAGAGGTG 
TTCTTCTAGA ATTAATTACT TTTATCTTTT GTCTTCATTT GTGGCCAAAA TTATGTTTAC 
TAGAGGAAAT TTGGGATCAT TCTCAGCTAA TTCCAAAATG TAGTGCTCTA TTGCATGGAT 
CCTTGGTAAT CCTCAAGCAT CAGATGCCAT AAGGGGAAAC TTAATTCTGC TAAATTAATG 
TTTATTTTGT GAGAAGTGAC TTTATCTTCA TTTGGGGTAG AAAAATTATT TCTTTATGTA 
GTAGAGACAA ATTATTCTCA TTTTGCAAGT ACTTTCAATT TAAGCTACAA AT TG AG AAAA 
CCGTTATAAA TAAGAATAAA ATAGGCCAGG CACAGTGGCT CACACCTGTA AT GCCAGCAC 
TTTGGGAGGC CGAGGTGGGC GGATCACCAG AGGTCAAGAG TTTGAGACCA GCTTGGTGAA 
ACCCTGTCTC TACTAAAAAT ACAAAAGTTA GCTGGGGCTG GTGGTGGGCA TCTGTAGTCC 
CAGCTAATTG GAAGGGTGAG GCGGGAGGAT CGCTTGAACC TGGGAGGCGG AGGTTCCAGA 
GAGCCAAGAT CGCACCACTG CACTACAGCC TGGGCGACAG AACGAGACCC TGTCTCCAAA 
GGAAAAACAA AAAAGAAGAA TAAAATAATT TGGATGAAAA TCATGTTTAT TTAAATAGTA 
ATGT CATG AG ACTATTAAAG ATGTGCCAGA GTTTCAATGA AAATCATTAA AGTAGGACAG 
CTAAGAAATT AATATTAATA TAAAAATTAT TGATAAT CTT AAATTATTGA TTATTCCTTA 
ACGCACTCCA TTCTCCTTTT ACATTTTATC ATGTTTCTTT TGAATATATG AATTGGCAAA 
GGACTTGATG AAACTGAGTA CTAAGATTTG GTACAGAGTA TGT CAGGAAG ACAACTCAGA 
TTGCCATTTT AAATAAAGTT GTACATGAAC AAAAAAAAAA AAAAAA 
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60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
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1680 
1740 
1800 
1860 



Seq ID NO: 124 Protein sequence: 
75 Protein Accession #: AAH22542 

1 11 21 31 41 51 

l l l I I l 

MCSEIILRQE VLKDGFHRDL LIKVKFGESI EDLHTCRLL I KQDIPAGLYV DPYELASLRE 
80 RNITEAVMVS ENFDIEAPNY LSKESEVLIY ARRDSQCIDC FQAFLPVHCR YHRPHSEDGE 

AS I WNNPDL LMFCDQAGSR RMIRFRFDSF DKTIEFPILK CWAHSEVAAP CADENEDICQ 
WNKMKYKSVY KNVILQVPVG LTVHTSLVCS VTLLITILCS KKKKK 

Seq ID NO: 125 DNA sequence 
85 Nucleic Acid Accession #: NM_004994.1 
Coding sequence: 20.. 2143 
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WO 02/086443 

i n 

I I 

AGACACCTCT GCCCTCACCA 
GGGCTGCTGC TTTGCTGCCC 
CCTGAGAACC AATCTCACCG 
CACTCGGGTG GCAGAGATGC 
CCAGAAGCAA CTGTCCCTGC 
GCGAACCCCA CGGTGCGGGG 
CAAGTGGCAC CACCACAACA 
GGCGGTGATT GACGACG CCT 
CACCTTCACT CGCGTGTACA 
GCACGGAGAC GGGTATCCCT 
TGGCCCCGGC ATT CAGGGAG 
GGGCGTCGTG GTTCCAACTC 
CATCTTCGAG GGCCGCTCCT 
CTGGTGCAGT ACCACGGCCA 
GAGACTCTAC ACCCGGGACG 
CCAAGGCCAA TCCTACTCCG 
CGCCACCACC GCCAACTACG 
CTCGACGGTG ATGGGGGGCA 
GGGTAAGGAG TACTCGACCT 
TAGCACCTCG AACTTTGACA 
TTTGTTCCTC GTGGCGGCGC 
GCCGGAGGCG CTCATGTACC 
CGACGTGAAT GGCATCCGGC 
AACCACCACC ACACCGCAGC 
TGTCCACCCC TCAGAGCGCC 
AGGTCCCCCC ACTGCTGGCC 
TGCCTGCAAC GTGAACATCT 
CAAGGATGGG AAGTACTGGC 
CCTTATCGCC GACAAGTGGC 
GCTCTCCAAG AAGCTTTTCT 
GGTGCTGGGC CCGAGGCGTC 
CGGGGCCCTC CGGAGTGGCA 
GTTCGACGTG AAGGCGCAGA 
CCCCGGGGTG CCTTTGGACA 
CCAGGACCGC TTCTACTGGC 
GGGCTACGTG ACCTATGACA 
GCAGTGCCAT GTAAATCCCC 
CAAACTGGTA TTCTGTTCTG 
TCACCTTTGT TTTTTGTTGG 



21 
I 

TGAGCCTCTG 
CCAGACAGCG 
ACAGGCAGCT 
GTGGAGAGTC 
CCGAGACCGG 
TCCCAGACCT 
TCACCTATTG 
TTGCCCGCGC 
GCCGGGACGC 
TCGACGGGAA 
ACGCCCATTT 
GGTTTGGAAA 
ACTCTGCCTG 
ACTACGACAC 
GCAATGCTGA 
CCTGCACCAC 
ACCGGGACAA 
ACTCGGCGGG 
GTACCAGCGA 
GCGACAAGAA 
ATGAGTTCGG 
CTATGTACCG 
ACCTCTATGG 
CCACGGCTCC 
CCACAGCTGG 
CTTCTACGGC 
TCGACGCCAT 
GATTCTCTGA 
CCGCGCTGCC 
TCTTCTCTGG 
TGGACAAGCT 
GGGGGAAGAT 
TGGTGGATCC 
CGCACGACGT 
GCGTGAGTTC 
TCCTGCAGTG 
ACTGGGACCA 
GAGGAAAGGG 
AGTGTTTCTA 
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31 

I 

GCAGCCCCTG 
CCAGTCCACC 
GGCAGAGGAA 
GAAATCTCTG 
TGAGCTGGAT 
GGGCAGATTC 
GATCCAAAAC 
CTTCGCACTG 
AGACATCGTC 
GGACGGGCTC 
CGACGATGAC 
CGCAGATGGC 
CACCACCGAC 
CGACGACCGG 
TGGGAAACCC 
GGACGGTCGC 
GCTCTTCGGC 
GGAGCTGTGC 
GGGCCGCGGA 
GTGGGGCTTC 
CCACGCGCTG 
CTTCACTGAG 
TCCTCGCCCT 
CCCGACGGTC 
CCCCACAGGT 
CACTACTGTG 
CGCGGAGATT 
GGGCAGGGGG 
CCGCAAGCTG 
GCGCCAGGTG 
GGGCCTGGGA 
GCTGCTGTTC 
CCGGAGCGCC 
CTTCCAGTAC 
CCGGAGTGAG 
C CCTGAGG AC 
ACCCTGGGGA 
AGGAGTGGAG 
ATAAACTTGG 



Seq ID NO: 126 Protein sequence: 
Protein Accession #: NP_004985.1



11 



MSLWQPLVLV 
RGESKSLGPA 
ITYWIQNYSE 
FDGKDGLLAH 
YSACTTDGRS 
ACTTDGRSDG 
CTSEGRGDGR 
PMYRFTEGPP 
PTAGPTGPPS 
RFSEGRGSRP 
LDKLGLGADV 
THDVFQYREK 



LLVLGCCFAA 
LLLLQKQLSL 
DLPRAVIDDA 
AFPPGPGIQG 
DGLPWCSTTA 
YRWCATTANY 
LWCATTSNFD 
LHKDDVNG I R 
AGPTGPPTAG 
QGPFLIADKW 
AQVTGALRSG 
AYFCQDRFYW 



21 
I 

PRQRQSTLVL 
PETGELD SAT 
FARAFALWSA 
DAHFDDDELW 
NYDTDDRFGF 
DRDKLFGFCP 
SDKKWGFCPD 
HLYGPRPEPE 
PSTATTVPLS 
P ALPRKLD S V 
RGKMLLFSGR 
RVSSRSELNQ 



31 
I 

FPGDLRTNLT 
LKAMRTPRCG 
VTPLTFTRVY 
SLGKGVWPT 
CPSERLYTRD 
TRADSTVMGG 
QGYSLFLVAA 
PRPPTTTTPQ 
PVDDACNVNI 
FEEPLSKKLF 
RLWRFDVKAQ 
VDQVGYVTYD 



Seq ID NO: 127 DNA sequence 
Nucleic Acid Accession #: NM_004181 
Coding sequence: 32-670 



I 

GCAGAAATAG 
GGTCGCCGGC 
GGTGCCAGCG 
CTTCAGGAAA 
CATGAAGCAG 
TAATCAAGAC 
AGAGAAAATG 
AGCCCATGAT 
TTTTATTCTG 
TCCGGTGAAC 
CAGAGAATTC 
GGCAGCCTAA 
AATATATACC 
TGTTCTGCAG 
ACAGCTGTCC 
TATGTCTTGT 
AAGACCTTGG 



11 
I 

CCTAGGGAGA 
CAGTGGCGCT 
CCTGCCTGCG 
AAGCAGATTG 
ACCATTGGGA 
AAACTGGGAT 
TCCCCTGAAG 
GCCGTGGCAC 
TTTAACAACG 
CATGGCGCCA 
ACCGAGCGTG 
TGCTCTGTGG 
CCCCATGCAG 
ACACGCCTTC 
ACTGGGCCAT 
AT CCGATATC 
ATGTGGTTAT 



21 
] 

TCAACCCCGA 
TCGTGGACGT 
CGCTGCTGCT 
AAGAGCTGAA 
ATTCCTGTGG 
TTGAGGATGG 
ACAGAGCAAA 
AGGAAGGCCA 
TGGATGGCCA 
GTT CAGAGGA 
AGCAAGGAGA 
GAGGGACTTT 
TCTAAAATGC 
CCCTCAGCCA 
TGTGGTGTGA 
TAACGCTTTA 
GTTGTCCTAA 



31 



GATGCTGAAC 
GCTGGGGCTG 
GCTGTTTCCC 
GGGACAAGAA 
CACAAT CGG A 
ATCAGTTCTG 
ATGCTTTGAA 
ATGTCGGGTA 
CCTCTATGAA 
CACCCTGCTG 
AGTCCGCTTC 
GCTGATTTCC 
TTCAGTACTT 
CACCCAGGCA 
GCTTCAGATG 
AATGGCTACT 
AGAATAAATT 
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Seq ID NO: 128 Protein sequence: 
Protein Accession #: NP_004172 
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WO 02/086443 PCT/US02/12476 

1 11 21 31 41 51 

i I I I I I 

MLNKVLSRLG VAGQWRFVDV LGLEEESLGS VPAPACALLL LFPLTAQHEN FRKKQIEELK 60 
GQEVSPKVYF MKQTIGNSCG TIGLIHAVAN NQDKLGFEDG SVLKQFLSET EKMSPEDRAK 120 
5 CFEKNEAIQA AHDAVAQEGQ CRVDDKVNFH FILFNNVDGH LYELDGRMPF PVNHGASSED 180 

TLLKDAAKVC REFTEREQGE VRFSAVALCK AA 



Seq ID NO: 129 DNA sequence 
10 Nucleic Acid Accession #: NM_000213 
Coding sequence: 127-5385

1 11 21 31 41 51 

1C I i i i i I 

1 J CGCCCGCGCG CTGCAGCCCC ATCTCCTAGC GGCAGCCCAG GCGCGGAGGG AGCGAGTCCG 60 

CCCCGAGGTA GGTCCAGGAC GGGCGCACAG CAGCAGCCGA GGCTGGCCGG GAGAGGGAGG 120 

AAGAGGATGG CAGGGCCACG CCCCAGCCCA TGGGCCAGGC TGCTCCTGGC AGCCTTGATC 180 

AGCGTCAGCC TCTCTGGGAC CTTGGCAAAC CGCTGCAAGA AGGCCCCAGT GAAGAGCTGC 240 

ACGGAGTGTG TCCGTGTGGA TAAGGACTGC GCCTACTGCA CAGACGAGAT GTTCAGGGAC 300 

20 CGGCGCTGCA ACACCCAGGC GGAGCTGCTG GCCGCGGGCT GCCAGCGGGA GAG CATCGTG 360 

GTCATGGAGA GCAGCTTCCA AATCACAGAG GAGACCCAGA TTGACACCAC CCTGCGGCGC 420 

AGCCAGATGT CCCCCCAAGG CCTGCGGGTC CGTCTGCGGC CCGGTGAGGA GCGGCATTTT 480 

GAGCTGGAGG TGTTTGAGCC ACTGGAGAGC CCCGTGGACC TGTACATCCT CATGGACTT C 540 

TCCAACTCCA TGTCCGATGA TCTGGACAAC CTCAAGAAGA TGGGGCAGAA CCTGGCTCGG 600 

25 GTCCTGAGCC AGCTCACCAG CGACTACACT ATTGGATTTG GCAAGTTTGT GGACAAAGTC 660 

AGCGTCCCGC AGACGGACAT GAGGCCTGAG AAGCTGAAGG AGCCCTGGCC CAACAGTGAC 720 

CCCCCCTTCT CCTTCAAGAA CGTCATCAGC CTGACAGAAG ATGTGGATGA GTTCCGGAAT 780 

AAACTGCAGG GAG AG CGGAT CTCAGGCAAC CTGGATGCTC CTGAGGGCGG CTTCGATGCC 840 

ATCCTGCAGA CAGCTGTGTG CACGAGGGAC ATTGGCTGGC GCCCGGACAG CACCCACCTG 90 0 

30 CTGGTCTTCT CCACCGAGTC AGCCTTCCAC TATGAGGCTG ATGGCGCCAA CGTGCTGGCT 960 

GGCATCATGA GCCGCAACGA TGAACGGTGC CACCTGGACA CCACGGGCAC CTACACCCAG 1020 

TACAGGACAC AGGACTACCC GTCGGTGCCC ACCCTGGTGC GCCTGCTCGC CAAGCACAAC 1080 

ATCATCCCCA TCTTTGCTGT CACCAACTAC TCCTATAGCT ACTACGAGAA GCTTCACACC 1140 

TATTTCCCTG TCTCCTCACT GGGGGTGCTG CAGGAGGACT CGT CCAACAT CGTGGAGCTG 1200 

35 CTGGAGGAGG CCTTCAATCG GATCCGCTCC AACCTGGACA TCCGGGCCCT AGACAGCCCC 1260 

CGAGGCCTTC GGACAGAGGT CACCTCCAAG ATGTTCCAGA AGACGAGGAC TGGGTCCTTT 132 0 

CACATCCGGC GGGGGGAAGT GGGTATATAC CAGGTGCAGC TGCGGGCCCT TGAGCACGTG 13 80 

GATGGGACGC ACGTGTGCCA GCTGCCGGAG GACCAGAAGG GCAACAT CCA TCTGAAACCT 1440 

TCCTTCTCCG ACGGCCTCAA GATGGACGCG GGCAT CATCT GTGATGTGTG CACCTG CGAG 1500 

40 CTGCAAAAAG AGGTGCGGTC AGCTCGCTGC AGCTTCAACG GAGACTTCGT GTGCGGACAG 1560 

TGTGTGTGCA GCGAGGGCTG GAGTGGCCAG ACCTGCAACT GCTCCACCGG CTCTCTGAGT 1620 

GACATTCAGC CCTGCCTGCG GGAGGGCGAG GACAAGCCGT GCTCCGGCCG TGGGGAGTGC 1680 

CAGTGCGGGC A CTGT GTGTG CTACGGCGAA GGCCGCTACG AGGGT CAGTT CTGCGAGTAT 1740 

GACAACTTCC AGTGT CCCCG CACTTCCGGG TTCCTCTGCA ATGACCGAGG ACGCTGCTCC 1800 

45 ATGGGCCAGT GTGTGTGTGA GCCTGGTTGG ACAGGCCCAA GCTGTGACTG TCCCCTCAGC 1860 

AATGCCACCT GCATCGACAG CAATGGGGGC AT CTGTAATG GACGTGGCCA CTGTGAGTGT 1920 

GGCCGCTGCC ACTGCCACCA GCAGTCGCTC TACACGGACA CCATCTGCGA GATCAACTAC 1980 

TCGGCGATCC ACCCGGGCCT CTGCGAGGAC CTACGCTCCT GCGTGCAGTG CCAGGCGTGG 2 040 

GGCACCGGCG AGAAGAAGGG GCGCACGTGT GAGGAATGCA ACTTCAAGGT CAAGATGGTG 210 0 

50 GACGAGCTTA AGAGAGCCGA GGAGGTGGTG GTGCGCTGCT CCTTCCGGGA CGAGGATGAC 2160 

GACTGCACCT ACAGCTACAC CATGGAAGGT GACGGCGCCC CTGGGCCCAA CAGCACTGTC 2220 

CTGGTGCACA AGAAGAAGGA CTGCCCTCCG GGCTCCTTCT GGTGGCTCAT CCCCCTGCTC 2280 

CTCCTCCTCC TGCCGCTCCT GGCCCTGCTA CTGCTGCTAT GCTGGAAGTA CTGTGCCTGC 2340 

TGCAAGGCCT GCCTGGCACT TCTCCCGTGC TGCAACCGAG GTCACATGGT GGGCTTTAAG 2400 

55 GAAGACCACT ACATGCTGCG GGAGAACCTG ATGG CCTCTG ACCACT TGGA CACGCCCATG 2460 

CTGCGCAGCG GGAACCTCAA GGGCCGTGAC GTGGTCCGCT GGAAGGTCAC CAACAACATG 2520 

CAGCGGCCTG GCTTTGCCAC TCATGCCGCC AGCATCAACC CCACAGAGCT GGTGCCCTAC 2580 

GGGCTGTCCT TGCGCCTGGC CCGCCTTTGC ACCGAGAACC TGCTGAAGCC TGACACTCGG 2640 

GAGTGCGCCC AGCTGCGCCA GGAGGTGGAG GAGAACCTGA ACGAGGTCTA CAGG CAGATC 2700 

60 T CCGGTGT AC ACAAGCTCCA GCAGACCAAG TTCCGGCAGC AGCCCAATGC CGGGAAAAAG 2 760 

CAAGACCACA CCATTGTGGA CACAGTGCTG ATGGCGCCCC GCTCGGCCAA GCCGGCCCTG 2 82 0 

CTGAAGCTTA CAGAGAAGCA GGTGGAACAG AGGGCCTTCC ACGACCTCAA GGTGGCCCCC 2 880 

GGCTACTACA CCCTCACTGC AGACCAGGAC GCCCGGGGCA TGGTGGAGTT CCAGGAGGGC 2 940 

GTGGAGCTGG TGGACGTACG GGTGCCCCTC TTTATCCGGC CTGAGGATGA CGACGAGAAG 3000 

65 CAGCTGCTGG TGGAGGCCAT CGACGTGCCC GCAGGCACTG CCACCCTCGG CCGCCGCCTG 3060 

GTAAACATCA CCAT CATCAA GGAGCAAGCC AGAGACGTGG TGTCCTTTGA GCAGCCTGAG 3120 

TTCTCGGTCA GCCGCGGGGA CCAGGTGGCC CGCATCCCTG TCATCCGGCG TGTCCTGGAC 3180 

GGCGGGAAGT CCCAGGTCTC CTACCGCACA CAGGATGGCA CCGCGCAGGG CAACCGGGAC 3240 

TACATCCCCG TGGAGGGTGA GCTGCTGTTC CAGCCTGGGG AGGCCTGGAA AGAGCTGCAG 3300 

70 GTGAAGCTCC TGGAGCTGCA AG AAGTT G AC TCCCTCCTGC GGGGCCGCCA GGTCCGCCGT 3 360 

TTCCACGTCC AGCTCAGCAA CCCTAAGTTT GGGGCCCACC TGGGCCAGCC CCACTCCACC 342 0 

ACCATCATCA TCAGGGACCC AGATGAACTG GACCGGAGCT TCACGAGTCA GATGTTGTCA 3 480 

TCACAGCCAC CCCCTCACGG CGACCTGGGC GCCCCGCAGA ACCCCAATGC TAAGGCCGCT 3 540 

GGGT CCAGGA AGATCCATTT CAACTGGCTG CCCCCTTCTG GCAAGCCAAT GGGGTACAGG 3600 

75 GTAAAGTACT GGATTCAGGG TGACTCCGAA TCCGAAGCCC ACCTGCTCGA CAGCAAGGTG 3660 

CCCTCAGTGG AGCTCACCAA CCTGTACCCG TATTGCGACT ATGAGATGAA GGTGTGCGCC 372 0 

TACGGGGCTC AGGGCGAGGG ACCCTACAGC TCCCTGGTGT CCTGCCGCAC CCACCAGGAA 3780 

GTGCCCAGCG AGCCAGGGCG TCTGGCCTTC AATGTCGTCT CCTCCACGGT GACCCAGCTG 3840 

AGCTGGGCTG AGCCGGCTGA GACCAACGGT GAGATCACAG CCTACGAGGT CTGCTATGGC 3900 

80 CTGGTCAACG ATGACAACCG ACCTATTGGG CCCATGAAGA AAGTGCTGGT TGACAACCCT 3960 

AAGAACCGGA TGCTGCTTAT TGAGAACCTT CGGGAGTCCC AGCCCTACCG CTACACGGTG 402 0 

AAGGCGCGCA ACGGGGCCGG CTGGGGGCCT GAGCGGGAGG CCAT CATCAA CCTGGCCACC 4080 

CAGCCCAAGA GGCCCATGTC CATCCCCATC ATCCCTGACA TCCCTATCGT GGACGCCCAG 4140 

AGCGGGGAGG ACTACGACAG CTTCCTTATG TACAGCGATG ACGTTCTACG CTCTCCATCG 42 00 

85 GGCAGCCAGA GGCCCAGCGT CTCCGATGAC ACTGAGCACC TGGTGAATGG CCGGATGGAC 42 60 

TTTGCCTTCC CGGGCAGCAC CAACTCCCTG CACAGGATGA CCACGACCAG TGCTGCTGCC 4320 

TATGGCACCC ACCTGAGCCC ACACGTGCCC CACCGCGTGC TAAGCACATC CTCCACCCTC 43 80 
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ACACGGGACT ACAACTCACT 
GACTACTCCA CCCTCACCTC 
GACACGCCCA CCCGCCTGGT 
CAGGAGCCGC GGTGCGAGCG 
GGCGGTGAGC TGCATCGGCT 
GACCTCCTGC CCAACCACTC 
GGCCGAGAGC GTGAGGGTGT 
TGTCCCCTGC CAGGCTCCGC 
TTCACTGCCC TGAGCCCAGA 
GGGGAT AT CG TCGGCTACCT 
GCATTCCGGG TGGATGGAGA 
AACGTGCCCT ACAAGTTCAA 
GAGGGCATCA TCACCATAGA 
GCCGGGCTCT TCCAGCACCC 
AGCGCCACCG AGCCCTTCCT 
GGCGGCTCCC TCACCCGGCA 
GGAACCCTTA GCACCCACAT 
CCCCCGCCAT GTCCCACTAG 
CCATCCTTGC ACCCCTGGGG 
TCCTGGGAGG CATGAAGGGG 
AAAGAGCTGG GAGCAGCACA 
ACTG 



GACCCGCTCA 
CGTCTCCTCC 
GTTCTCTGCC 
GCCGCTGCAG 
CAACATCCCC 
CTACGTGTTC 
CATCACCATT 
CTTCACTTTG 
CTCGCTGCAG 
GGTGACCTGT 
CAGCCCCGAG 
GGTGCAGGCC 
GTCCCAGGAT 
GCTGCAAAGC 
AGTGGATGGG 
TGTGACCCAG 
GGACCAACAG 
GCGTCCTCCC 
GCCCAGCCCA 
GCAAGGTCCG 
AGGACCCAGC 



GAACACTCAC 
CACGACTCTC 
CTGGGGCCCA 
GGCTACAGTG 
AACCCTGCCC 
CGCGTGCGGG 
GAATCCCAGG 
AGCACTCCCA 
CTGAGCTGGG 
GAGATGGCCC 
AGCCGGCTGA 
AGGACCACTG 
GGAGGACCCT 
GAGTACAGCA 
CCGACCCTGG 
GAGTTTGTGA 
TTCTTCCAAA 
GACTCCTCTC 
CCCGCATGCA 
TCCTCTGTGG 
CTTTGTTCTG 



ACTCGACCAC 
GCCTGACTGC 
CATCTCTCAG 
TGGAGTACCA 
AGACCTCGGT 
CCCAGAGCCA 
TGCACCCGCA 
GTGCCCCAGG 
AGCGGCCACG 
AAGGAGGAGG 
CCGTGCCGGG 
AGGGCTTCGG 
TCCCGCAGCT 
GCATCACCAC 
GGGCCCAGCA 
GCCGGACACT 
CTTGACCGCA 
CCGGAGCCTC 
CAGAGCAGGG 
GCCCAAACCT 
CACTTAATAA 



ACTGCCGAGG 4440 

TGGTGTGCCC 4500 

AGTGAGCTGG 4560 

GCTGCTGAAC 4620 

GGTGGTGGAA 4680 

GGAAGGCTGG 4740 

GAGCCCACTG 4800 

CCCGCTGGTG 4860 

GAGGCCCAAT 492 0 

GCCAGCCACC 4 98 0 

CCTCAGCGAG 5040 

GCCAGAGCGC 5100 

GGGCAGCCGT 5160 

CACCCACACC 522 0 

CCTGGAGGCA 52 80 

GACCACCAGC 5340 

CCCTGCCCCA 5400 

CTCAGCTACT 5460 

GCTAGGTGTC 5520 

ATTTGTAACC 5580 

ATGGTTTTGC 5640 



PCT/US02/12476 



25 Seq ID NO: 130 Protein sequence: 
Protein Accession #: NP_000204



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



I 

MAGPRPSPWA 
CNTQAELLAA 
EVFEPLESPV 
PQTDMRPEKL 
QTAVCTRDIG 
TQDYPSVPTL 
EAFNRIRSNL 
THVCQLPEDQ 
CSEGWSGQTC 
FQCPRTSGFL 
CHCHQQSLYT 
LKRAEEVWR 
LLPLLALLLL 
SGNLKGRDW 
AQLRQEVEEN 
LTEKQVEQRA 
LVEAIDVPAG 
KSQVSYRTQD 
VQLSNPKFGA 
RKIHFNWLPP 
AQGEGPYSSL 
NDDNRPIGPM 
KRPMSIPIIP 
FPGSTNSLHR 
STLTSVSSHD 
EIiHRLNIPNP 
LPGSAFTLST 
RVDGDSPESR 
LFQHPLQSEY 
LSTHMDQQFF 



11 

I 

RLLLAALISV 
GCQRESIWM 
DLYILMDFSN 
KEPWPNSDPP 
WRPDSTHLLV 
VRLLAKHNII 
DIRALDSPRG 
KGNIHLKPSF 
NCSTGSLSDI 
CNDRGRCSMG 
DTICEINYSA 
CSFRDEDDDC 
LCWKYCACCK 
RWKVTNNMQR 
LNEVYRQISG 
FHDLKVAPGY 
TATLGRRLVN 
GTAQGNRDYI 
HLGQPHSTTI 
SGKPMGYRVK 
VSCRTHQEVP 
KKVLVDNPKN 
DIPIVDAQSG 
MTTTSAAAYG 
SRLTAGVPDT 
AQTSVWEDL 
PSAPGPLVFT 
LTVPGLSENV 
SSITTTHTSA 
QT 



21 
I 

SLSGTLANRC 
ESSFQITEET 
SMSDDLDNLK 
FSFKNVISLT 
FSTESAFHYE 
PIFAVTNYSY 
LRTEVTSKMF 
SDGLKMDAGI 
Q P CLfREGEDK 
QCVCEPGWTG 
IHPGLCEDLR 
TYSYTMEGDG 
ACLALLPCCN 
PGFATHAASI 
VHKLQQTKFR 
YTLTADQDAR 
ITIIKEQARD 
PVEGELLFQP 
IIRDPDELDR 
YWIQGDSESE 
SEPGRLAFNV 
RMLLIENLRE 
EDYDSFLMYS 
THLSPHVPHR 
PTRLVFSALG 
LPNHSYVFRV 
ALSPDSLQLS 
PYKFKVQART 
TEPFLVDGPT 



31 

I 

KKAPVKSCTE 
QIDTTLRRSQ 
KMGQNLARVL 
EDVDE FRNKL 
ADGANVLAGI 
SYYEKLHTYF 
QKTRTGSFHI 
ICDVCTCELQ 
PCSGRGECQC 
PSCDCPLSNA 
SCVQCQAWGT 
APGPNSTVLV 
RGHMVGFKED 
NPTELVPYGL 
QQPNAGKKQD 
GMVEFQEGVE 
WSFEQPEFS 
GEAWKELQVK 
SFTSQMLSSQ 
AHLLDSKVPS 
VSSTVTQLSW 
SQPYRYTVKA 
DDVLRSPSGS 
VLSTSSTLTR 
PTSLRVSWQE 
RAQSQEGWGR 
WERPRRPNGD 
TEGFGPEREG 
LGAQHLEAGG 



41 
I 

CVRVDKDCAY 
MSPQGLRVRL 
SQLTSDYTIG 
QGERISGNLD 
MSRNDERCHL 
PVSSLGVLQE 
RRGEVGIYQV 
KEVRSARCSF 
GHCVCYGEGR 
TCIDSNGGIC 
GEKKGRTCEE 
HKKKDCPPGS 
HYMLRENLMA 
SLRLARLCTE 
HTIVDTVLMA 
LVDVRVPLFI 
VSRGDQVARI 
LLELQEVDSL 
PPPHGDLGAP 
VELTNLYPYC 
AEPAETNGE I 
RNGAGWGPER 
QRPSVSDDTE 
DYNSLTRSEH 
PRCERPLQGY 
EREGVITIES 
IVGYLVTCEM 
IITIESQDGG 
S1>TRHVTQEF 



51 
I 

CTDEMFRDRR 
RPGEERHFEL 
FGKFVDKVSV 
APEGGFDAIL 
DTTGTYTQYR 
DSSNIVELLE 
QLRALEHVDG 
NGDFVCGQCV 
YEGQFCEYDN 
NGRGHCECGR 
CNFKVKMVDE 
FWWIilPLLLIj 
SDHLDTPMLR 
NLLKPDTREC 
PRSAKPALLK 
RPEDDDEKQL 
P V I RRVLDGG 
LRGRQVRRFH 
QNPNAKAAGS 
DYEMKVCAYG 
TAYEVCYGLV 
EAIINLATQP 
HLVNGRMD FA 
SHSTTLPRDY 
SVEYQLLNGG 
QVHPQSPLCP 
AQGGGPATAF 
PFPQLGSRAG 
VSRTLTTSGT 



Seq ID NO: 131 DNA sequence 
Nucleic Acid Accession #: BC004372 
Coding sequence: 132.. 2231 



85 



1 
1 

CCTCGTGCCG 
GCCGGCCCCT 
CTCCGGACAC 
TGAGCCTGGC 
AGAAAAATGG 
ATAGCACCTT 
GCAGGTATGG 
GTGCAGCAAA 
ATTGCTTCAA 
ATGCCTTTGA 
AGAAAGGAGA 
ACGTGAGCAG 
CCTTTTCTAC 
ACAGAATCCC 
AAGAAAATGA 
ATGAAGATTT 
AGAACCAGGA 
CAACCACAAG 
ACCCAGAAGC 
ATTCTACAAG 
AGGAACAGTG 



11 
1 

CGGACCCCAG 
GCCCCGCGCC 
CATGGACAAG 
GCAGATCGAT 
TCGCTACAGC 
GCCCACAATG 
GTT CATAGAA 
CAACACAGGG 
TGCTTCAGCT 
TGGACCAATT 
ATACAGAACG 
CGGCTCCTCC 
TGTACACCCC 
TGCTACCAGT 
AGATGAAAGA 
TATCTCCAGC 
CTGGACCCAG 
GATGACTGAT 
ACACCCTCCC 
CACAATCCAG 
GTTTGGCAAC 



21 

I 

CCTCTGCCAG 
CAGGGATCCT 
TTTTGGTGGC 
TTGAATATAA 
ATCTCTCGGA 
GCCCAGATGG 
GGGCATGTGG 
GTGTACATCC 
CCACCTGAAG 
ACCATAACTA 
AATCCTGAAG 
AGTGAAAGGA 
ATCCCAGACG 
ACGTCTTCAA 
GACAGACACC 
ACCATTTCAA 
TGGAACCCAA 
GTAGACAGAA 
CTCATTCACC 
GCAACTCCTA 
AGATGGCATG 



31 , 
I 

GTTCGGTCCG 
CCAGCTCCTT 
ACGCAGCCTG 
CCTGCCGCTT 
CGGAGGCCGC 
AGAAAGCTCT 
TGATTCCCCG 
TCACATCCAA 
AAGATTGTAC 
TTGTTAACCG 
ACATCTACCC 
GCAGCACTTC 
AAGACAGTCC 
ATACCATCTC 
TCAGTTTTTC 
CCACACCACG 
GCCATTCAAA 
ATGGCACCAC 
ATGAGCATCA 
GTAGTACAAC 
AGGGATATCG 



41 



CCATCCTCGT 
TCGCCCGCGC 
GGGACTCTGC 
TGCAGGTGTA 
TGACCTCTGC 
GAGCATCGGA 
GATCCACCCC 
CACCTCCCAG 
ATCAGTCACA 
TGATGGCACC 
CAGCAACCCT 
AGGAGGTTAC 
CTGGATCACC 
AGCAGGCTGG 
TGGATCAGGC 
GGCTTTTGAC 
TCCGGAAGTG 
TGCTTATGAA 
TGAGGAAGAA 
GGAAGAAACA 
CCAAACACCC 



51 
I 

CCCGTCCTCC 
CCTCCGTTCG 
CTCGTGCCGC 
TTCCACGTGG 
AAGGCTTTCA 
TTTGAGACCT 
AACTCCATCT 
TATGACACAT 
GACCTGCCCA 
CGCTATGTCC 
ACTGATGATG 
ATCTTTTACA 
GACAGCACAG 
GAGCCAAATG 
ATTGATGATG 
CACACAAAAC 
CTACTTCAGA 
GGAAACTGGA 
GAGACCCCAC 
GCTACCCAGA 
AGAGAAGACT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 



238 



10 



15 



20 



WO 02/086443 

CCCATTCGAC AACAGGGACA 
GGACAACACC AAGCCCAGAG 
CCATGGGACG AGGTCATCAA 
CGCTTCAGCC TACTGCAAAT 
CTCTTTCAAT GACAACGCAG 
TGGAAGAAGA TAAAGACCAT 
TCACAGGTGG AAGAAGAGAC 
ATACCTCTCA TTACCCACAC 
AGACTGGGTC CTTTGGAGTT 
GTTCCTTATC AGGAGACCAA 
GATCTGAATC AGATGGACAC 
GTCCTATAAG GACACCCCAA 
TGGCTTTGAT TCTTGCAGTT 
AAAAGCTAGT GATCAACAGT 
ACGGAGAGGC CAGCAAGTCT 
CTCCAGACCA GTTTATGACA 
TTGGGGTGTA ACACGTACAC 
TACAGGGAGC TGGGACACTT 
TTTTTAGCAT AAAATTTTCT 



GCTGCAGCCT 
GACAGTTCCT 
GCAGGAAGAA 
CCAAACACAG 
CAGAGTAATT 
CCAACAACTT 
CCAAATCATT 
ACGAAGGAAA 
ACTGCAGTTA 
GACACATTCC 
TCACATGGGA 
ATTCCAGAAT 
TGCATTGCAG 
GG CAATGG AG 
CAGGAAATGG 
GCTGATGAGA 
CATTATCTTG 
AACAGATGCA 
ACTCTTAAAA 



CAGCTCATAC 
GGACTGATTT 
GGATGGATAT 
GTTTGGTGGA 
CTCAGAGCTT 
CTACTCTGAC 
CTGAAGGCTC 
GCAGGACCTT 
CTGTTGGAGA 
ACCCCAGTGG 
GTCAAGAAGG 
GGCTGATCAT 
TCAACAGTCG 
CTGTGGAGGA 
TGCATTTGGT 
CAAGGAACCT 
GAAAGAAACA 
ATGTGCTACT 
AAAAAAAAAA 



CAGCCATCCA 
CTTCAACCCA 
GGACTCCAGT 
AGATTTGGAC 
CTCTACATCA 
ATCAAGCAAT 
AACTACTTTA 
CATCCCAGTG 
TTCCAACTCT 
GGGGTCCCAT 
TGGAGCAAAC 
CTTGGCATCC 
AAGAAGGTGT 
CAGAAAGCCA 
GAACAAGGAG 
GCAGAATGTG 
ACCGTTGGAA 
GATTGTTTCA 
AAAAAAA 



ATGCAAGGAA 1320 

ATCTCACACC 1380 

CATAGTACAA 1440 

AGGACAGGAC 1500 

CATGAAGGCT 1560 

AGGAATGATG 1620 

CTGGAAGGTT 1680 

ACCTCAGCTA 1740 

AATGTCAATC 1800 

ACCACTCATG 1860 

ACAACCTCTG 1920 

CTCTTGGCCT 1980 

GGGCAGAAGA 2040 

AGTGGACTCA 2100 

TCGTCAGAAA 2160 

GACATGAAGA 2220 

ACATAACCAT 2280 

TTGCGAATCT 2340 



PCT/US02/12476 



Seq ID NO: 132 Protein sequence: 
Protein Accession #: AAH04372 



25 



30 



35 



40 



45 



50 



55 



60 



11 



21 



31 



MDKFWWHAAW 
PTMAQMEKAL 
ASAPPEEDCT 
GSSSERSSTS 
DERDRHLSFS 
MTDVDRNGTT 
FGNRWHEGYR 
GHQAGRRMDM 
KDHPTTSTLT 
FGVTAVTVGD 
TPQIPEWIiII 
SKSQEMVHLV 



GLCLVPLSLA 
SIGFETCRYG 
SVTDLPNAFD 
GGYIFYTFST 
GSGIDDDEDF 
AYEGNWNPEA 
QTPREDSHST 
DSSHSTTLQP 
SSNRNDVTGG 
SNSNVNRSLS 
liASLLALALI 
NKESSETPDQ 



QIDLNITCRF 
FIEGHWIPR 
GPITITIVNR 
VHPIPDEDSP 
ISSTISTTPR 
HPPLIHHEHH 
TGTAAASAHT 
TANPNTGLVE 
RRDPNHSEGS 
GDQDTFHPSG 
LAVCIAVNSR 
FMTADETRNL 



AGVFHVEKNG 
IHPNSICAAN 
DGTRYVQKGE 
WITDSTDRIP 
AFDHTKQNQD 
EEEETPHSTS 
SHPMQGRTTP 
DLDRTGPLSM 
TTLLEGYTSH 
GSHTTHGSES 
RRCGQKKKLV 
QNVDMKIGV 



41 
I 

RYSISRTEAA 
NTGVYILTSN 
YRTNPEDIYP 
ATSTSSNTIS 
WTQWNPSHSN 
TIQATPSSTT 
SPEDSSWTDF 
TTQQSNSQSF 
YPHTKESRTF 
DGHSHGSQEG 
INSGNGAVED 



51 
I 

DLCKAFNSTL 
TSQYDTYCFN 
SNPTDDDVSS 
AGWEPNEENE 
PEVLLQTTTR 
EETATQKEQW 
FNPISHPMGR 
STSHEGLEED 
IPVTSAKTGS 
GANTTSGPIR 
RKP SGLNGEA 



Seq ID NO: 133 DNA sequence 
Nucleic Acid Accession #: NM_002882 
Coding sequence: 150-755 



CGAGGTTCGG 
GCGGAGGGAA 
AGCCGAGCCG 
ATGATACTTC 
TTTCTCTTCC 
TGCGGGCAAA 
GCACTGGTGA 
GGAGGGACAA 
AGCCCAACGC 
AGTGCCCCAA 
TCAAAACAAA 
CAGG CAAAAA 
AGGAGACCAA 
TCTCTTTCCT 
ATTCTTTCAT 



11 

I 

GTCGTGGGGC 
GGAGCTACGA 
CCGCCGCCGC 
CACTGAGAAT 
TGAG CAAGAA 
ACTGTTCCGA 
CGTCAAGCTC 
GACCCTGAAG 
AGGTAGCGAC 
GCCAGAGCTG 
GTTTGAAGAA 
TGATCATGCC 
GGAGGATGCT 
TTCCTTTTTT 
TTTTACAAGG 



21 
I 

GGAGGGAAGA 
GTAGCCGCCG 
CGCGCCCCCA 
ACAGACGAGT 
ATTAAAACAC 
TTTGCCTCTG 
CTGAAGCACA 
ATCTGTGCCA 
CGTGCCTGGG 
CTGGCCATCC 
TGCAGGAAAG 
GAAAAAGTGG 
GAGGAGAAGC 
TAAAAAATTT 
GACGTTATAT 



31 
I 

GCGGGCGGGC 
AGAGGCCGCG 
TGGCGGCCGC 
CCAACCATGA 
TGGAAGAAGA 
AGAACGATCT 
AGGAGAAAGG 
ACCACTACAT 
TCTGGAACAC 
GCTTCCTGAA 
AGATCGAAGA 
CGGAAAAGCT 
AATAAATCGT 
TACCCTGCCC 
AAAGAACTGA 



41 
I 

GGGAGGCGCC 
GAGCCAGCGA 
CAAGGACACT 
CCCTCAGTTT 
TGAAGAGGAA 
CCCAGAATGG 
GGCCATCCGC 
CACGCCGATG 
CCACGCTGAC 
TGCTGAGAAT 
GAGAGAAAAG 
AGAAGCTCTC 
CTTATTTTAT 
CTCTTTTTCG 
ACTC 



51 
I 

GGCGCCAGAC 
CGACCGACCC 
CATGAGGACC 
GAGCCAATAG 
CTTTTTAAAA 
AAGGAGCGAG 
CTCCTCATGC 
ATGGAGCTGA 
TTCGCCGACG 
GCACAGAAAT 
AAAGCAGGAT 
TCGGTGAAGG 
TTTCTTTTCC 
GTTTGTTTTT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 



65 



Seq ID NO: 134 Protein sequence: 
Protein Accession #: NP_002873



1 11 21 31 41 51 

1 I ! I I I 

MAAAKDTHED HDTSTENTDE SNHDPQFEPI VSLPEQEIKT LEEDEEELFK MRAKLFRFAS 

ENDLPEWKER GTGDVKLLKH KEKGAIRLLM RRDKTLKICA NHYITPMMEL KPNAGSDRAW

VWNTHADFAD ECPKPELLAI RFLNAENAQK FKTKFEECRK EIEEREKKAG SGKNDHAEKV 

AEKLEALSVK EETKEDAEEK Q 



60 
120 
180 



75 



80 



85 



Seq ID NO: 135 DNA sequence 

Nucleic Acid Accession #: NM_000077.2 

Coding sequence: 272-742



CCCAACCTGG 
TCCTCCGAGC 
GGATTTGAGG 
GGGCTGGCTG 
GGAGAGCAGG 
GCCTTCGGCT 
GCTGCTGGAG 
GGTCATGATG 



11 
I 

GGCGACTTCA 
ACTCGCTCAC 
GACAGGGTCG 
GTCACCAGAG 
CAGCGGGCGG 
GACTGGCTGG 
GCGGGGGCGC 
ATGGGCAGCG 



21 
I 

GGTGTGCCAC 
GGCGTCCCCT 
GAGGGGGCTC 
GGTGGGGCGG 
CGGGGAGCAG 
CCACGGCCGC 
TGCCCAACGC 
CCCGAGTGGC 



31 
I 

ATTCGCTAAG 
TGCCTGGAAA 
TTCCGCCAGC 
ACCGCGTGCG 
CATGGAGCCG 
GGCCCGGGGT 
ACCGAATAGT 
GGAGCTGCTG 



41 
I 

TGCTCGGAGT 
GATACCGCGG 
ACCGGAGGAA 
CTCGGCGGCT 
GCGGCGGGGA 
CGGGTAGAGG 
TACGGTCGGA 
CTGCTCCACG 



51 
I 

TAATAGCACC 60 

TCCCTCCAGA 120 

GAAAGAGGAG 180 

GCGGAGAGGG 240 

GCAGCATGGA 300 

AGGTGCGGGC 360 

GGCCGATCCA 420 

GCGCGGAGCC 480 



239 



WO 02/086443 

CAACTGCGCC GACCCCGCCA CTCTCACCCG ACCCGTGCAC GACGCTGCCC GGGAGGGCTT 
CCTGGACACG CTGGTGGTGC TGCACCGGGC CGGGGCGCGG CTGGACGTGC GCGATGCCTG 
GGGCCGTCTG CCCGTGGACC TGGCTGAGGA GCTGGGCCAT CGCGATGTCG CACGGTACCT 
GCGCGCGGCT GCGGGGGGCA CCAGAGGCAG TAACCATGCC CGCATAGATG CCGCGGAAGG 
TCCCTCAGAC ATCCCCGATT GAAAGAACCA GAGAGGCTCT GAGAAACCTC GGGAAACTTA 
GATCAT CAGT CACCGAAGGT CCTACAGGGC CACAACTGCC CCCGCCACAA CCCACCCCGC 
TTTCGTAGTT TTCATTTAGA AAATAGAGCT TTTAAAAATG TCCTGCCTTT TAACGTAGAT 
ATATGCCTTC CCCCACTACC GTAAATGTCC ATTTATATCA TTTTTTATAT ATT CTTATAA 
AAATGTAAAA AAGAAAAACA CCGCTTCTGC CTTTTCACTG TGTTGGAGTT TTCTGGAGTG 
•AGCACTCACG CCCTAAGCGC ACATTCATGT GGGCATTTCT TGCGAGCCTC GCAGCCTCCG 
GAAGCTGTCG ACTTCATGAC AAGCATTTTG TGAACTAGGG AAGCTCAGGG GGGTTACTGG 
CTTCTCTTGA GTCACACTGC TAGCAAATGG CAGAACCAAA GCTCAAATAA AAATAAAATA 
ATTTTCATTC ATT C ACT C 

Seq ID NO: 136 Protein sequence: 
Protein Accession #: NP_000068.1 

1 11 21 

l I l 

MEPAAGSSME PSADWLATAA ARGRVEEVRA 
ELLLLHGAEP NCADPATLTR PVHDAAREGF 
LGHRDVARYL RAAAGGTRGS NHARIDAAEG



31 41 51 

I I I 

LLEAGALPNA PNSYGRRPIQ VMMMGSARVA 

LDTLVVLHRA GARLDVRDAW GRLPVDLAEE
PSDIPD 



Seq ID NO: 137 DNA sequence 

Nucleic Acid Accession #: NM_058196.1 

Coding sequence: 104-421 



1 11 21 31 41 51 

I I I l l I 

TGTGTGGGGG TCTGCTTGGC GGTGAGGGGG CTCTACACAA GCTTCCTTTC CGTCATGCCG 
GCCCCCACCC TGGCTCTGAC CATTCTGTTC TCTCTGGCAG GTCATGATGA TGGGCAGCGC 
CCGAGTGGCG GAGCTGCTGC TGCTCCACGG CGCGGAGCCC AACTGCG CCG ACCCCGCCAC 
TCTCACCCGA CCCGTGCACG ACGCTGCCCG GGAGGGCTTC CTGGACACGC TGGTGGTGCT 
GCACCGGGCC GGGGCGCGGC TGGACGTGCG CGATGCCTGG GGCCGTCTGC CCGTGGACCT 
GGCTGAGGAG CTGGGCCATC GCGATGTCGC ACGGTACCTG CGCGCGGCTG CGGGGGGCAC 
CAGAGGCAGT AACCATGCCC GCATAGATGC CGCGGAAGGT CCCTCAGACA TCCCCGATTG 
AAAGAACCAG AGAGGCTCTG AGAAACCTCG GGAAACTTAG ATCATCAGTC ACCGAAGGTC 
CTACAGGGCC ACAACTGCCC CCGCCACAAC CCACCCCGCT TTCGTAGTTT TCATTTAGAA 
AATAGAGCTT TTAAAAATGT CCTGCCTTTT AACGTAGATA TAAGCCTTCC CCCACTACCG 
TAAATGTCCA TTT AT AT CAT TTTTTATATA TTCTTATAAA AATGTAAAAA AGAAAAACAC 
CGCTTCTGCC TTTTCACTGT GTTGGAGTTT TCTGGAGTGA GCACTCACGC CCTAAGCGCA 
CATTCATGTG GGCATTTCTT GCGAGCCTCG CAGCCTCCGG AAGCTGTCGA CTTCATGACA 
AGCATTTTGT GAACTAGGGA AGCTCAGGGG GGTTACTGGC TTCTCTTGAG TCACACTGCT 
AGCAAATGGC AGAACCAAAG CTCAAATAAA AATAAAATAA TTTTCATTCA TTCACTC 



Seq ID NO: 138 Protein sequence: 
Protein Accession #: NP_478103.1

1 11 21 31 41 51 

l l I I I I 

MMMGSARVAE LLLLHGAEPN CADPATLTRP VHDAAREGFL DTLVVLHRAG ARLDVRDAWG
RLPVDLAEEL GHRDVARYLR AAAGGTRGSN HARIDAAEGP SDIPD

Seq ID NO: 139 DNA sequence

Nucleic Acid Accession #: NM_058197.1 

Coding sequence: 272-684

1 11 21 31 41 51 

I 1 1 1 1 i 

CCCAACCTGG GGCGACTTCA GGTGTGCCAC ATT CGCTAAG TGCTCGGAGT TAATAGCACC 

TCCTCCGAGC ACTCGCTCAC GGCGTCCCCT TGCCTGGAAA GATACCGCGG TCCCTCCAGA 

GGATTTGAGG GACAGGGTCG GAGGGGGCTC TTCCGCCAGC ACCGGAGGAA GAAAGAGGAG 

GGGCTGGCTG GTCACCAGAG GGTGGGGCGG ACCGCGTGCG CTCGGCGGCT GCGGAGAGGG 

GGAGAGCAGG CAGCGGGCGG CGGGGAGCAG CATGGAGCCG GCGGCGGGGA G CAGCATGGA 

GCCGGCGGCG GGGAGCAGCA TGGAGCCTTC GGCTGACTGG CTGGCCACGG CCGCGGCCCG 

GGGTCGGGTA GAGGAGGTGC GGGCGCTGCT GGAGGCGGGG GCGCTGCCCA ACGCACCGAA 

TAGTTACGGT CGGAGGCCGA TCCAGGTGGG TAGAAGGTCT GCAGCGGGAG CAGGGGATGG 

CGGGCGACTC TGGAGGACGA AGTTTGCAGG GGAATTGGAA TCAGGTAGCG CTTCGATTCT 

CCGGAAAAAG GGGAGGCTTC CTGGGGAGTT TTCAGAAGGG GTTTGTAATC ACAGACCTCC 

TCCTGGCGAC GCCCTGGGGG CTTGGGAAAC CAAGGAAGAG GAATGAGGAG CCACGCGCGT 

ACAGATCTCT CGAATGCTGA GAAGATCTGA AGGGGGGAAC ATATTTGTAT TAGATGGAAG 

TCATGATGAT GGGCAGCGCC CGAGTGGCGG AGCTGCTGCT GCTCCACGGC GCGGAGCCCA 

ACTGCGCCGA CCCCGCCACT CTCACCCGAC CCGTGCACGA CGCTGCCCGG GAGGGCTTCC 

TGGACACGCT GGTGGTGCTG CACCGGGCCG GGGCGCGGCT GGACGTGCGC GATGCCTGGG 

GCCGTCTGCC CGTGGACCTG GCTGAGGAGC TGGGCCATCG CGATGTCGCA CGGTACCTGC 

GCGCGGCTGC GGGGGGCACC AGAGGCAGTA ACCATGCCCG CATAGATGCC GCGGAAGGTC 

CCTCAGACAT CCCCGATTGA AAGAACCAGA GAGGCTCTGA GAAACCTCGG GAACTTAGAT 

CAT CAGT C A C CGAAGGT CCT ACAGGGCCAC AACTGCCCCC GCCACAACCC ACCCCGCTTT 

CGTAGTTTTC ATTTAGAAAA TAGAGCTTTT AAAAATGTCC TGCCTTTTAA CGTAGATATA 

TGCCTTCCCC CACTACCGTA AATGTCCATT TATATCATTT TTTATATATT CTTATAAAAA 

TGTAAAAAAG AAAAACACCG CTTCTGCCTT TTCACTGTGT TGGAGTTTTC TGGAGTGAGC 

ACTCACGCCC TAAGCGCACA TTCATGTGGG CATTTCTTGC GAGCCTCGCA GCCTCCGGAA 

GCTGTCGACT TCATGACAAG CATTTTGTGA ACTAGGGAAG CTCAGGGGGG TTACTGGCTT 

CTCTTGAGTC ACACTG CTAG CAAATGGCAG AACCAAAGCT CAAATAAAAA TAAAATAATT 



240 



WO 02/086443 

TTCATTCATT CACTC 



PCT/US02/12476 



Seq ID NO: 140 Protein sequence: 
Protein Accession #: NP_478104.1



10 



1 11 21 31 41 51

I I I I I I 

MEPAAGSSME PAAGSSMEPS ADWLATAAAR GRVEEVRALL EAGALPNAPN SYGRRPIQVG

RRSAAGAGDG GRLWRTKFAG ELESGSASIL RKKGRLPGEF SEGVCNHRPP PGDALGAWET

KEEE 



60 
120 



15 



Seq ID NO: 141 DNA sequence 

Nucleic Acid Accession #: NM_058195.1

Coding sequence: 163-684 



20 



25 



30 



35 



40 



1 
1 

CCTCCCTACG 
GATCTTGGAG 
GGGCGCGCTC 
GTGGGTCCCA 
GGCGGCGCAG 
TTGGTGACCC 
CACATCCCGC 
GTGCTGATGC 
CATGATGATG 
CTGCGCCGAC 
GGACACGCTG 
CCGTCTGCCC 
CGCGGCTGCG 
CTCAGACATC 
CATCAGTCAC 
CGTAGTTTTC 
TGCCTTCCCC 
TGTAAAAAAG 
ACTCACGCCC 
GCTGTCGACT 
CTCTTGAGTC 
TTCATTCATT 



11 
I 

GGCGCCTCCG 
GTCCGGGTGG 
AGGGAAGGCG 
GTCTGCAGTT 
CGGCTGCCGA 
TCCGGATTCG 
GGCTCACGGG 
TACTGAGGAG 
GGCAGCGCCC 
CCCGCCACTC 
GTGGTGCTGC 
GTGGACCTGG 
GGGGGCACCA 
CCCGATTGAA 
CGAAGGT CCT 
ATTTAGAAAA 
CACTACCGTA 
AAAAACACCG 
TAAGCGCACA 
TCATGACAAG 
ACACTGCTAG 
CACTC 



21 
i 

GCAGCCCTTC 
GAGTGGGGGT 
GGTGCGCGCC 
AAGGGGGCAG 
GCTCGGCCCT 
GCGCGCGTGC 
GGAGTGGGCA 
CCAGCGTCTA 
GAGTGGCGGA 
TCACCCGACC 
ACCGGGCCGG 
CTGAGGAGCT 
GAGGCAGTAA 
AGAACCAGAG 
ACAGGGCCAC 
TAGAGCTTTT 
AATGTCCATT 
CTTCTGCCTT 
TTCATGTGGG 
CATT TTGTGA 
CAAATGGCAG 



31 
i 

CCGCGTGCGC 
GGGGTGGGGG 
TGCGGGGCGG 
GAGTGGCGCT 
GGAGGCGGCG 
GGCCCGCCGC 
GCGCCAGGGG 
GGGCAGCAGC 
GCTGCTGCTG 
CGTGCACGAC 
GGCGCGGCTG 
GGGCCAT CGC 
CCATGCCCGC 
AGGCTCTGAG 
AACTGCCCCC 
AAAAATGTCC 
TAT AT CATTT 
TTCACTGTGT 
CATTTCTTGC 
ACTAGGGAAG 
AACCAAAGCT 



41 
1 

AGGGCTCAGA 
TGGGGGTGAA 
AGATGGGCAG 
GCTCACCTCT 
AGAACATGGT 
GAGTGAGGGT 
CGCCCGCCGC 
CGCTTCCTAG 
CTCCACGGCG 
GCTGCCCGGG 
GACGTGCGCG 
GATGTCGCAC 
ATAGATGCCG 
AAACCTCGGG 
GCCACAACCC 
TGCCTTTTAA 
TTTATATATT 
TGGAGTTTTC 
GAGCCTCGCA 
CTCAGGGGGG 
CAAATAAAAA 



51 
1 

GCCGTTCCGA 60 

GGTGGGGGGC 12 0 

GGGGCGGTGC 180 

GGTGCCAAAG 240 

GCGCAGGTTC 300 

TTTCGTGGTT 3 60 

TGTGGCCCTC 420 

AAGACCAGGT 480 

CGGAGCCCAA 540 

AGGGCTTCCT 60 0 

ATGCCTGGGG 660 

GGTACCTGCG 720 

CGGAAGGTCC 780 

AAACTTAGAT 840 

ACCCCGCTTT 90 0 

CGTAGATATA 960 

CTTATAAAAA 102 0 

TGGAGTG AG C 1080 

GCCTCCGGAA 1140 

TTACTGGCTT 12 00 

TAAAATAATT 1260 



Seq ID NO: 142 Protein sequence: 
Protein Accession #: NP_478102.1



45 



50 



55 



60 



65 



70 



75 



80 



1 11 21 31 41 51 

I I I I I I 

MGRGRCVGPS LQLRGQEWRC SPLVPKGGAA AAELGPGGGE NMVRRFLVTL RIRRACGPPR
VRVFVVHIPR LTGEWAAPGA PAAVALVLML LRSQRLGQQP LPRRPGHDDG QRPSGGAAAA
PRRGAQLRRP RHSHPTRARR CPGGLPGHAG GAAPGRGAAG RARCLGPSAR GPG 

Seq ID NO: 143 DNA sequence 
Nucleic Acid Accession #: NM_018131 
Coding sequence: 412.. 1107 



85 



GAAATTGCAC 
GATAAAGAGA 
AATGCTTATC 
GCCAGATATA 
AGGAGGGAGC 
TCTGCTGCAA 
CAGACTGTGG 
CAGCTGAAAG 
GTCTATGTAA 
GCTCATTCAC 
AAGCAGAAAT 
CAAACCATAA 
CAAAAAGAAG 
CATCTGGAAG 
ATTGCTAGGG 
CAGTCTCTTT 
GAACAACAGA 
GTGCAGCATC 
GTTGGAATCC 
AGGAGAGACT 
CAATGGAAGC 
CGATCTGCTT 
TTAAAAGATT 
CATTTTGCAT 
CTTTTAGGCT 
GGCTGCAATG 
AAAATACTTG 
GCAAAATATT 
ACTGTGTTCG 
ATTGTTAAGA 



11 
I 

ACTTAAAGAC 
GACAGAGACT 
AACTCACAGA 
GTACTACCGC 
AGGTGTTGAA 
CCTCACGAAT 
CTCCAAACTG 
ATGCTCTGGA 
AAGGACTTTT 
TCCCACAGCA 
GTTACAACGA 
CTCAGCTGAG 
TTCACAATTT 
ATGATAGGCA 
GAAAACTTGA 
ACACATCTCT 
TGCAGGCATG 
AATTGCATGT 
TTGAAACAGC 
GAAAACAGAG 
CTGGTGGAAT 
GTCCATGTGG 
CAATACTGTA 
AAAACTGCCT 
GCTGTGCATT 
ACAGAATGTG 
GTGAGGAAAA 
TTATGTTTCG 
CATTTTTTAT 
GGTGGTGATA 



21 



31 



ATCAGTGGAT 
TTTGGAGAAA 
GAAGGACAAA 
ATTGCTTGAA 
AGCCTTATCT 
TGCTGAACTT 
CTTCAACTCA 
G AAAAAT C AG 
AGCAAAGATC 
GACAAAAAAG 
TCTCTTGGCA 
TTTTGAACTG 
AAAT CAGCTG 
TAAAACAGAG 
AGAAGAGAAG 
GCTAAAGCAG 
TACTTTAGAC 
AATTCTTAAG 
TTCATGAGTT 
AAAAAGTTGC 
GTCCCAAGTG 
AATACTGTTC 
TTTTCTGTTA 
ATCTACCTTT 
TCTCTTGGCA 
GTGAGCAGCG 
GATAGCTCAG 
GGGGTTTTGA 
CCAAGCACTT 
GATACTATTT 



GAAATCACAA 
ATTCGAGTCC 
GAAATACAGC 
CAGCTGGAAG 
GAAGAGAAAG 
GAAAGCAAAA 
TCAATAAATA 
CAGTGGCTCG 
TTTGAGTTGG 
CCTGAATCAG 
AGTGCAAAAA 
AGTGAATTTC 
TTGTATTCAC 
AAGATACAAA 
AAGAGATCCG 
CAAGAAGAAC 
TTTGAAAATG 
GAGCTCCGAA 
TGCCATCACA 
CGCCTCACCA 
CAATATACAG 
AAAGTAGCAA 
GCTTGTGGGC 
GACACTCCAG 
GTGATACCTC 
TCTACTGAGA 
GTTATTGCTA 
AAAATCAAAG 
AGAAAACCTA 
TTTTTTCATA 



41 

I 

GTGGGAAAGG 
TTGAGGCTGA 
GACTGAGAGA 
AGACAACGAG 
ACGTATTGAA 
CCAATACACT 
ATATTCATGA 
TGTATGATCA 
AAAAGAAAAC 
AAGGTTATCT 
AAGATCTTGA 
GAAGAAAATA 
AAAGAAGGGC 
AACTCAGGGA 
AAGAGCTCTT 
AAACAAGGGT 
AAAAACT CG A 
AAGCAAGAAA 
GAGCCATTAG 
AAAAGTCCCA 
TAT CCAG CCA 
AATAAGTATT 
ATTTTGAATT 
CATGCTAGTG 
CCTGACATGG 
TACTAACATT 
ATGGGTTAAT 
ATAATTAACC 
CAATCCTAAT 
TTGTATAGCG 



51 
I 

AAAGCTGACT 
GAAGGAGAAG 
CCAACTGAAG 
AGAAGGAGAA 
ACAACAGTTG 
CCGTTTATCA 
AATGGAAATA 
GCAGCGGGAA 
GGAAACAGCT 
TCAAGAAGAG 
GGTTGAACGA 
TGAAGAAACC 
AGATGTGCAA 
AGAGAATGAT 
ATCTCAGGTC 
AGCTCTGTTG 
CCGT CAACAT 
AAAT AA CACA 
TCACTTTCCA 
CTGCTGCACT 
CTGAGCATCG 
TGTTTTGATA 
ATATATTTCA 
AATCATGTAT 
TTCATCATCA 
TTGCACTGTC 
G CACCAG CAA 
AAGGATCTTA 
TTTGATGTCC 
GTTATTAGAA 



60 
120 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 



241 



10 



WO 02/086443 PCT/US02/12476 

AAGTTGGGGA TTTTCTTGAT CTTTATTGCT GCTTACCATT GAAACTTAAC CCAGCTGTGT 1860 

TCCCCAACTC TGTTCTGCGC ACGAAACAGT ATCTGTTTGA GGCATAATCT TAAGTGGCCA 1920 

CACACAATGT TTTCTCTTAT GTTATCTGGC AGTAACTGTA ACTTGAATTA CATTAGCACA 1980 

TTCTGCTTAG CTAAAATTGT TAAAATAAAC TTTAATAAAC CCATGTAGCC CTCTCATTTG 2 040 

ATTGACAGTA TTTTAGTTAT TTTTGGCATT CTTAAAGCTG GGCAATGTAA TGATCAGATC 2100 

TTTGTTTGTC TGAACAGGTA TTTTTATACA TGCTTTTTGT AAACCAAAAA CTTTTAAATT 2160 

TCTTCAGGTT TTCTAACATG CTTACCACTG GGCTACTGTA AATGAGAAAA GAATAAAATT 2220 
ATTTAATGTT TT 

Seq ID NO: 144 Protein sequence: 
Protein Accession #: NP_060601



25 



60 



65 



70 



1 11 21 31 41 51

I I I I I I 

MEIQLKDALE KNQQWLVYDQ QREVYVKGLL AKIFELEKKT ETAAHSLPQQ TKKPESEGYL 60

QEEKQKCYND LLASAKKDLE VERQTITQLS FELSEFRRKY EETQKEVHNL NQLLYSQRRA 120 

DVQHLEDDRH KTEKIQKLRE ENDIARGKLE EEKKRSEELL SQVQSLYTSL LKQQEEQTRV 180 

ALLEQQMQAC TLDFENEKLD RQHVQHQLHV ILKELRKARK NNTVGILETA S



Seq ID NO: 145 DNA sequence 
Nucleic Acid Accession #: NM_001168 
Coding sequence: 50.. 478 



1 11 21 31 41 51 

I I I I I 1 

CCGCCAGATT TGAATCGCGG GACCCGTTGG CAGAGGTGGC GGCGGCGGCA TGGGTGCCCC 60 

30 GACGTTGCCC CCTGCCTGGC AGCCCTTTCT CAAGGACCAC CGCATCTCTA CATTCAAGAA 120 

CTGGCCCTTC TTGGAGGGCT GCGCCTGCAC CCCGGAGCGG ATGGCCGAGG CTGGCTTCAT 180 

CCACTGCCCC ACTGAGAACG AG CCAGACTT GGCCCAGTGT TTCTTCTGCT TCAAGGAGCT 240 

GGAAGGCTGG GAGCCAGATG ACGACCCCAT AGAGGAACAT AAAAAGCATT CGTCCGGTTG 3 00 

CGCTTTCCTT TCTGTCAAGA AGCAGTTTGA AGAATTAACG CTTGGTGAAT TTTTGAAACT 3 60 

35 GGACAGAGAA AGAGCCAAGA ACAAAATTGC AAAGGAAACC AACAATAAGA AGAAAGAATT 420 

TGAGGAAACT GCGAAGAAAG TGCGCCGTGC CAT CGAGCAG CTGGCTGCCA TGGATTGAGG 480 

CCTCTGGCCG GAGCTGCCTG GTCCCAGAGT GGCTGCACCA CTTCCAGGGT TTATTCCCTG 540 

GTGCCACCAG CCTTCCTGTG GGCCCCTTAG CAATGTCTTA GGAAAGGAGA TCAACATTTT 600 

CAAATTAGAT GTTTCAACTG TGCTCCTGTT TTGTCTTGAA AGTGGCACCA GAGGTGCTTC 660 

40 TGCCTGTGCA GCGGGTGCTG CTGGTAACAG TGGCTGCTTC TCTCTCTCTC TCTCTTTTTT 72 0 

GGGGGCTCAT TTTTGCTGTT TTGATTCCCG GGCTTACCAG GTGAGAAGTG AGGGAGGAAG 7 80 

AAGGCAGTGT CCCTTTTGCT AGAGCTGACA GCTTTGTTCG CGTGGGCAGA GCCTTCCACA 840 

GTGAATGTGT CTGGACCTCA TGTTGTTGAG GCTGTCACAG TCCTGAGTGT GGACTTGGCA 900 

GGTGCCTGTT G AATCTGAGC • TGCAGGTTCC TTATCTGTCA CACCTGTGCC TCCTCAGAGG 960 

45 ACAGTTTTTT TGTTGTTGTG TTTTTTTGTT TTTTTTTTTT GGTAGATGCA TGACTTGTGT 1020 

GTGATGAGAG AATGGAGACA GAGTCCCTGG CTCCTCTACT GTTTAACAAC ATGGCTTTCT 1080 

TATTTTGTTT GAATTGTTAA TTCACAGAAT AGCACAAACT ACAATTAAAA CTAAGCACAA 1140 

AGCCATTCTA AGT CATTGGG GAAACGGGGT GAACTTCAGG TGGATGAGGA GACAGAATAG 1200 

AGTGATAGGA AGCGTCTGGC AGATACTCCT TTTGCCACTG CTGTGTGATT AGACAGGCCC 12 60 

50 AGTGAGCCGC GGGGCACATG CTGGCCGCTC CTCCCTCAGA AAAAGGCAGT GGCCTAAATC 132 0 

CTTTTTAAAT GACTTGGCTC GATGCTGTGG GGGACTGGCT GGGCTGCTGC AGGCCGTGTG 1380 

TCTGTCAGCC CAACCTTCAC ATCTGTCACG TTCTCCACAC GGGGGAGAGA CGCAGTCCGC 1440 

CCAGGTCCCC GCTTTCTTTG GAGGCAGCAG CTCCCGCAGG GCTGAAGTCT GGCGTAAGAT 1500 

GATGGATTTG ATTCGCCCTC CTCCCTGTCA TAGAGCTGCA GGGTGGATTG TTACAGCTTC 1560 

55 GCTGGAAACC TCTGGAGGTC ATCTCGGCTG TTCCTGAGAA AT AAAAAG C C TGTCATTTC 



Seq ID NO: 146 Protein sequence: 
Protein Accession #: NP_001159 

1 11 21 31 41 51 

I I I I 1 I 

MGAPTLPPAW QPFLKDHRIS TFKNWPFLEG CACTPERMAE AGFIHCPTEN EPDLAQCFFC 60 
FKELEGWEPD DDPIEEHKKH SSGCAFLSVK KQFEELTLGE FLKLDRERAK NKIAKETNNK 120 
KKEFEETAKK VRRAIEQLAA MD 

Seq ID NO: 147 DNA sequence 

Nucleic Acid Accession #: NM_014176.1 

Coding sequence: 127-720 



1 11 21 31 41 51 • 

I I I I I I 

GCGCGCAGCG CTGGTACCCC GTTGGTCCGC GCGTTGCTGC GTTGTGAGGG GTGTCAGCTC 60 

AGTGCATCCC AGGCAGCTCT TAGTGTGGAG CAGTGAACTG TGTGTGGTTC CTTCTACTTG 120 

75 GGGATCATGC AGAGAGCTTC ACGTCTGAAG AGAGAGCTGC ACATGTTAGC CACAGAGCCA 180 

CCCCCAGGCA TCACATGTTG G CAAG AT AAA GACCAAATGG ATGACCTGCG AGCTCAAATA 240 

TTAGGTGGAG CCAACACACC TTATGAGAAA GGTGTTTTTA AGCTAGAAGT TATCATTCCT 300 

GAGAGGTACC CATTTGAACC TCCTCAGATC CGATTTCTCA CTCCAATTTA TCATCCAAAC 360 

ATTGATTCTG CTGGAAGGAT TTGTCTGGAT GTTCTCAAAT TGCCACCAAA AGGTGCTTGG 420 

80 AG AC CAT CCC TCAACATCGC AACTGTGTTG ACCTCTATTC AGCTGCTCAT GTCAGAACCC 480 

AACCCTGATG ACCCGCTCAT GGCTGACATA TCCTCAGAAT TTAAATATAA TAAGCCAGCC 540 

TTCCTCAAGA ATGCCAGACA GTGGACAGAG AAGCATGCAA GACAGAAACA AAAGGCTGAT 600 

GAGGAAGAGA TGCTTGATAA TCTACCAGAG GCTGGTGACT CCAGAGTACA CAACTCAACA 660 

CAGAAAAGGA AGGCCAGTCA GCTAGTAGGC ATAGAAAAGA AATTTCATCC TGATGTTTAG 720 

85 GGGACTTGTC CTGGTTCATC TTAGTTAATG TGTTCTTTGC CAAGGTGATC TAAGTTGCCT 7 80 

ACCTTGAATT TTTTTTTAAA TATATTTGAT GACATAATTT TTGTGTAGTT TATTTATCTT 840 

GTACATATGT ATTTTGAAAT CTTTTAAACC TGAAAAATAA ATAGTCATTT AATGTTGAAA 900 



242 



WO 02/086443 

AAAAAAAAAA AAAAAAAAAA AAAAAAAA 



PCT/US02/12476 



Seq ID NO: 148 Protein sequence: 
Protein Accession #: NP_054895.1 

5 

1 11 21 31 41 51 

I I I I I I 

MQRASRLKRE LHMLATEPPP GITCWQDKDQ MDDLRAQILG GANTPYEKGV FKLEVIIPER 60 

YPFEPPQIRF LTPIYHPNID SAGRICLDVL KLPPKGAWRP SLNIATVLTS IQLLMSEPNP 120 

10 DDPLMADISS EFKYNKPAFL KNARQWTEKH ARQKQKADEE EMLDNLPEAG DSRVHNSTQK 180 
RKASQLVGIE KKFHPDV 

Seq ID NO: 149 DNA sequence 
Nucleic Acid Accession #: NM_003812 
15 Coding sequence: 224-2722 

1 11 21 31 41 51 

I I I 1 I I 

TCCTCTGCGT CCCGCCCCGG GAGTGGCTGC GAGGCTAGGC GAGCCGGGAA AGGGGGCGCC 60 

20 GCCCAGCCCC GAGCCCCGCG CCCCGTGCCC CGAGCCCGGA GCCCCCTGCC CGCGGCGGCA 12 0 

CCATGCGCGC CGAGCCGGCG TGACCGGCTC CGCCCGCGGC CGCCCCGCAG CTAGCCCGGC 180 

GCTCTCGCCG GCCACACGGA GCGGCGCCCG GGAGCTATGA GCCATGAAGC CGCCCGGCAG 240 

CAGCTCGCGG CAGCCGCCCC TGGCGGGCTG CAGCCTTGCC GGCGCTTCCT GCGGCCCCCA 3 00 

ACGCGGCCCC GCCGGCTCGG TGCCTGCCAG CGCCCCGGCC CGCACGCCGC CCTGCCGCCT 3 60 

25 GCTTCTCGTC CTTCTCCTGC TGCCTCCGCT CGCCGCCTCG TCCCGGCCCC GCGCCTGGGG 420 

GGCTGCTGCG CCCAGCGCTC CGCATTGGAA TGAAACTGCA GAAAAAAATT TGGGAGTCCT 480 

GGCAGATGAA GACAATACAT TGCAACAGAA TAGCAGCAGT AATATCAGTT ACAGCAATGC 540 

AATGCAGAAA GAAATCACAC TGCCTTCAAG ACTCATATAT TACATCAACC AAGACTCGGA 600 

AAGCCCTTAT CACGTTCTTG ACACAAAGGC AAGACACGAG CAAAAACATA ATAAGGCTGT 660 

30 CCATCTGGCC CAGGCAAGCT TCCAGATTGA AGCCTTCGGC TCCAAATTCA TTCTTGACCT 72 0 

CATACTGAAC AATGGTTTGT TGTCTTCTGA TTATGTGGAG ATTCACTACG AAAATGGGAA 780 

ACCACAGTAC TCTAAGGGTG GAGAGCACTG TTACTACCAT GGAAGCATCA GAGGCGTCAA 840 

AGACT CCAAG GTGGCTCTGT CAACCTGCAA TGGACTTCAT GGCATGTTTG AAGATGATAC 90 0 

CTTCGTGTAT ATGATAGAGC CACTAGAGCT GGTTCATGAT GAGAAAAGCA CAGGTCGACC 960 

35 ACATATAATC CAGAAAACCT TGGCAGGACA GTATTCTAAG CAAATGAAGA ATCTCACTAT 1020 

GGAAAGAGGT GACCAGTGGC CCTTTCTCTC TGAATTACAG TGGTTGAAAA GAAGGAAGAG 10 80 

AG CAGTG AAT CCATCACGTG GTATATTTGA AGAAATGAAA TATTTGGAAC TTATGATTGT 114 0 

TAATGATCAC AAAACGTATA AGAAGCATCG CTCTTCTCAT GCACATACCA ACAACTTTGC 12 00 

AAAGTCCGTG GTCAACCTTG TGGATT CTAT TTACAAGGAG CAGCTCAACA CCAGGGTTGT 12 60 

40 CCTGGTGGCT GTAGAGACCT GGACTGAGAA GGATCAGATT GACATCACCA CCAACCCTGT 132 0 

GCAGATGCTC CATGAGTTCT CAAAATACCG GCAGCGCATT AAGCAGCATG CTGATGCTGT 1380 

GCACCTCATC TCGCGGGTGA CATTTCACTA TAAGAGAAGC AGTCTGAGTT ACTTTGGAGG 1440 

TGTCTGTTCT CGCACAAGAG GAGTTGGTGT GAATGAGTAT GGTCTTCCAA TGGCAGTGGC 150 0 

ACAAGTATTA TCGCAG AG CC TGGCTCAAAA CCTTGGAATC CAATGGGAAC CTTCTAGCAG 1560 

45 AAAGCCAAAA TGTGACTGCA CAGAATCCTG GGGTGGCTGC ATCATGGAGG AAACAGGGGT 162 0 

GTCCCATTCT CGAAAATTTT CAAAGTGCAG CATTTTGGAG TATAGAGACT TTT TACAGAG 1680 

AGGAGGTGGA GCCTGCCTTT TCAACAGGCC AACAAAGCTA TTTGAGCCCA CGGAATGTGG 1740 

AAATGGATAC GTGGAAGCTG GGGAGGAGTG TGATTGTGGT TTTCATGTGG AATGCTATGG 18 0 0 

ATTATGCTGT AAGAAATGTT CCCTCTCCAA CGGGGCTCAC TGCAGCGACG GGCCCTGCTG 1860 

50 TAACAATACC TCATGTCTTT TTCAGCCACG AGGGTATGAA TGCCGGGATG CTGTGAACGA 192 0 

GTGTGATATT ACTGAATATT GTACTGGAGA CTCTGGTCAG TGCCCACCAA ATCTTCATAA 1980 

GCAAGACGGA TATGCATGCA ATCAAAATCA GGGCCGCTGC TACAATGGCG AGTGCAAGAC 2 04 0 

CAGAGACAAC CAGTGTCAGT ACATCTGGGG AACAAAGGCT GCAGGGT CTG ACAAGTTCTG 2100 

CTATGAAAAG CTGAATACAG AAGGCACTGA GAAGGGAAAC TGCGGGAAGG ATGGAGACCG 2160 

55 GTGGATTCAG TGCAGCAAAC ATGATGTGTT CTGTGGATTC TTACTCTGTA CCAATCTTAC 222 0 

TCGAGCTCCA CGTATTGGTC AACTTCAGGG TGAGATCATT CCAACTTCCT TCTACCATCA 2280 

AGGCCGGGTG ATTGACTGCA GTGGTGCCCA TGTAGTTTTA GATGATGATA CGGATGTGGG 2340 

CTATGTAGAA GATGGAACGC CATGTGGCCC GTCTATGATG TGTTTAGATC GGAAGTGCCT 240 0 

ACAAATTCAA GCCCTAAATA TGAGCAGCTG TCCACTCGAT TCCAAGGGTA AAGTCTGTTC 2460 

60 GGGCCATGGG GTGTGTAGTA ATGAAGCCAC CTGCATTTGT GATTTCACCT GGGCAGGGAC 2520 

AGATTGCAGT ATCCGGGATC CAGTTAGGAA CCTTCACCCC CCCAAGGATG AAGGACCCAA 2580 

GGGTCCTAGT GCCACCAATC TCATAATAGG CTCCATCGCT GGTGCCATCC TGGTAGCAGC 2640 

TATTGTCCTT GGGGGCACAG GCTGGGGATT TAAAAATGTC AAGAAGAGAA GGTTCGATCC 2700 

TACTCAGCAA GGCCCCATCT GAATCAGCTG CGCTGGATGG ACACCGCCTT GCACTGTTGG 2 760 

65 ATTCTGGGTA TGACATACTC GCAGCAGTGT TAGTGGAACT ATTAAGTTTG TAAACAAAAC 2 82 0 

CTTTGGGTGG TAATGACTAC GGAGCTAAAG TTGGGGTGAC AAGGATGGGG TAAAAGAAAA 2880 

CTGTCTCTTT TGGAAATAAT GTCAAAGAAC ACCTTTCACC ACCTGTCAGT AAACGGGGGA 2 940 

GGGGGCAAAA GACCATGCTA TAAAAAGAAC TGTT CCAGAA TCTTTTTTTT TCCCTAATGG 3000 
ACGAAGGAAC AACACACACA CAAAAATTAA ATGCAATAAA GGAATCATTA AAAA 



70 



Seq ID NO: 150 Protein sequence: 
Protein Accession #: NP_003803 



75 i 11 21 31 41 51 

1 I I I I 1 

MKPPGSSSRQ PPLAGCSLAG ASCGPQRGPA GSVPASAPAR TPPCRLLLVL LLLPPDAASS 60 

RPRAWGAAAP SAPHWNETAE KNLGVLADED NTLQQNSSSN ISYSNAMQKE ITLPSRLIYY 120 

INQDSESPYH VLDTKARHQQ KHNKAVHLAQ ASFQIEAFGS KFILDLILNN GLLSSDYVEI 180 

80 HYENGKPQYS KGGEHCYYHG SIRGVKDSKV ALSTCNGLHG MFEDDTFVYM IEPLELVHDE 240 

KSTGRPHIIQ KTLAGQYSKQ MKNLTMERGD QWPFLSELQW LKRRKRAVNP SRGIFEEMKY 300 

LELMIVNDHK TYKKHRSSHA HTNNFAKSVV NLVDSIYKEQ LNTRVVLVAV ETWTEKDQID 360 

ITTNPVQMLH EFSKYRQRIK QHADAVHLIS RVTFHYKRSS LSYFGGVCSR TRGVGVNEYG 420 

LPMAVAQVLS QSLAQNLGIQ WEPSSRKPKC DCTESWGGCI MEETGVSHSR KFSKCSILEY 480 

85 RDFLQRGGGA CLFNRPTKLF EPTECGNGYV EAGEECDCGF HVECYGLCCK KCSLSNGAHC 540 

SDGPCCNNTS CLFQPRGYEC RDAVNECDIT EYCTGDSGQC PPNLHKQDGY ACNQNQGRCY 600 

NGECKTRDNQ CQYIWGTKAA GSDKFCYEKL NTEGTEKGNC GKDGDRWIQC SKHDVFCGFL 660 



243 



WO 02/086443 

LCTNLTRAPR IGQLQGEIIP TSFYHQGRVI DCSGAHVVLD DDTDVGYVED GTPCGPSMMC 
LDRKCLQIQA LNMSSCPLDS KGKVCSGHGV CSNEATCICD FTWAGTDCSI RDPVRNLHPP 
KDEGPKGPSA TNLIIGSIAG AILVAAIVLG GTGWGFKNVK KRRFDPTQQG PI 
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15 
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Seq ID NO: 151 DNA sequence 
Nucleic Acid Accession #: NM_023915 
Coding sequence: 250-1326 



11 



21 



31 



35 



GGCACGAGGG 
TCAAAGCTTA 
GTGAATGGAC 
CCCACGCCTC 
AACTGAAGAA 
CAAGAGAGTC 
AATGAATTTG 
TTGCTGAATG 
TTCTATCTCA 
ATAGTCCATG 
TCAGTTTTGT 
GATCGCTATC 
ACGAAGGTTT 
ATCCTGACAA 
CCTTTGGGGG 
GTGCTGGTGA 
AGGCAATTCA 
GTGGCTGTGT 
AGTCACTTAG 
AT T AC ACT T T 
TGTAGGTCAT 
ATCAGATCAC 
GTGTAGGCCT 
TTCATTATCC 



TTTCGTTTTC 
TTCTTAATTA 
AGCCAGCCAC 
AATCGTCCCC 
TGGGGTTCAA 
ACAATTCAGG 
ACACAATTGT 
GTTTAGCAGT 
AAAACATAGT 
ATGCAGGATT 
TTTATGCAAA 
TGAAGGTGGT 
TATCTGTTTG 
ATGGTCAGCC 
TCAAATGGCA 
TTCTGATCGG 
TAAGTCAGTC 
TTTTTACCTG 
ACAGGCTTTT 
TCTTGTCTGC 
TTTCAAGAAG 
TGCAAAGTGT 
TTTATTGTTT 
TTAAAAAAAA 



ATGCTTTACC 
GAGACAAGAA 
CACAATGAAA 
AAGTGTTTCC 
CTTGACGCTT 
CAACAGGAGC 
CTTGCCGGTG 
GTGGATCTTC 
GGTTGCAGAC 
TGGACCTTGG 
CATGTATACT 
CAAGCCATTT 
TGTTTGGGTG 
AACAGAGGAC 
TACGGCAGTC 
ATGTTACATA 
AAGCCGAAAG 
CTTTCTACCA 
AGATGAATCT 
GTGTAATGTT 
GCTGTTCAAA 
GAGAAGATCG 
GTTGGAATCG 
AA 



AG AAAAT CCA 
ACCTGTTTCA 
GAAATCAAAC 
TGACACGCAT 
GCAAAATTAC 
GACGGGCCAG 
CTTTATCTCA 
TTCCACATTA 
CTCATAATGA 
TACTTCAAGT 
TCCAT CGTGT 
GGGGACTCTC 
ATCATGG CTG 
AATATCCATG 
ACCTATGTGA 
GCCATATCCA 
CGAAAACATA 
TATCACTTGT 
GCACAAAAAA 
TGCCTGGATC 
AAATCAAATA 
GAAGTTCGCA 
ATATGTACAA 



41 
1 

CTTCCCTGCC 
ACTTGAAGAC 
CAGGAATAAC 
CTTTGCTTAC 
CAAATAACGA 
GAAAGAACAC 
TTATATTTGT 
GGAATAAAAC 
CGCTGACATT 
TTATTCTCTG 
TCCTTGGGCT 
GGATGTACAG 
TTTTGTCTTT 
ACTGCTCAAA 
ACAGCTGCTT 
GGTACAT CCA 
ACCAGAGCAT 
GCAGAATTCC 
TCCTATATTA 
CAATAATTTA 
TCAGAACCAG 
TATATTATGA 
AGTGTAAATA 



51 



GACCTTAGTT 60 

ACCGTATGAG 120 

CTATGCTGAA 180 

AGTGCATCAC 240 

GCTGCACGGC 30 0 

CACCCTTCAC 3 60 

GGCAAGCATC 42 0 

CAGCTTCATA 480 

TCCATTTCGA 540 

CAGATACACT 600 

GATAAGCATT 660 

CATAACCTTC 72 0 

GCCAAACATC 7 80 

ACTTAAAAGT 840 

GTTTGTGGCC 900 

CAAATCCAGC 960 

CAGGGTTGTT 102 0 

TTTTACTTTT 1080 

CTGCAAAGAA 1140 

CTTTTTCATG 12 00 

GAGTGAAAGC 12 60 

TT ACACTGAT 1320 

AATGTTTCTT 13 80 



Seq ID NO: 152 Protein sequence: 
Protein Accession #: NP_076404 

40 1 11 21 31 41 51 

! I ! I I I 

MGFNLTLAKL PNNELHGQES HNSGNRSDGP GKNTTLHNEF DTIVLPVLYL IIFVASIDLN 60 

GLAVWIFFHI RNKTSFIFYL KNIWADLIM TDTFPFRIVH DAGFGPWYFK FILCRYTSVL 120 

FYANMYTSIV FLGLISIDRY DKWKPFGDS RMYSITFTKV LSVCVWVIMA VLSLPNIII/T 180 

45 NGQPTEDNIH DCSKLKSPLG VKWHTAVTYV NSCLFVAVLV ILIGCYIAIS RYIHKSSRQF 240 

ISQSSRKRKH NQSIRVWAV FFTCFLPYHL CRIPFTFSHL DRLLDESAQK ILYYCKEITL 3 00 

FLSACNVCLD PIIYFFMCRS FSRRLFKKSN IRTRSESIRS LQSVRRSEVR IYYDYTDV 



Seq ID NO: 153 DNA sequence 
50 Nucleic Acid Accession #: D80008.1 
Coding sequence: 149-739 

1 11 21 31 41 51 

« I 1 ) I 1 I 

55 GTTCGGCGCC AAAGCGCGGA GCGGAGGCCG AGGCGAGAGC CTGGCGCTGT AGGACTAGAA 60 

CGAAAGGAGT GAGGCGCCGA GAGCCCAGAT ACCATTTTGG CGTGAGAGCT GGTGGTTGGC 120 

AAGGCCGCGG GAGTGGGAAG CGTCCGCCAT GTTCTGCGAA AAAGCCATGG AACTGATCCG 180 

CGAGCTGCAT CGCGCGCCCG AAGGGCAACT GCCTGCCTTC AACGAGGATG GACTCAGACA 24 0 

AGTTCTGGAG GAGATGAAAG CTTTGTATGA ACAAAACCAG TCTGATGTGA ATGAAGCAAA 3 00 

60 GTCAGGTGGA CGAAGTGATT TGATACCAAC TATCAAATTT CGACACTGTT CTCTGTTAAG 3 60 

AAATCGACGC TGCACTGTAG CATACCTGTA TGACCGCTTG CT T CG GAT CA GAGCACTCAG 420 

ATGGGAATAT GGTAGCGTCT TGCCAAATGC ATTACGATTT CACATGGCTG CTGAAGAAAT 4 80 

GGAGTGGTTT AATAATTATA AAAGATCTCT TG CTACTT AT ATGAGGTCAC TGGGAGGAGA 540 

TGAAGGTTTG GACATTACAC AGGATATGAA ACCACCAAAA AG CCTAT ATA TTGAAGTCCG 600 

65 GTGTCTAAAA GACTATGGAG AATTTGAAGT TGATGATGGC ACTTCAGTCC TATTAAAAAA 660 

AAATAGCCAG CACTTTTTAC CT CGATGGAA ATGTGAGCAG CTGATCAGAC AAGGAGTCCT 720 

GGAGCACATC CTGTCATGAC CATGCGCCGA GGCACTTCCA GGCTTCACTC AACTCATGGA 780 

CTCCTCTGTA CTCACTCTCT CCACCACTCC CTTCACCTCC CTCTTTGATT TTAGAAGCTA 840 

TAGACATTGT TTAAGATAAC TAAGAATACT TGGCTAAGAA GTATAATTTG CTAACTATTA 900 

70 AGGACTTTCT TTTTTTAATG TTGTACACTA TTCTTCCTAC TCTTTTTTGG TTTTGGTTTT 960 

GTTTTGTAGA GACTGTCTCA CTATGTTGCC CAAGCTGGTC TCAAACT CCT GGCCTCAAGC 102 0 

AGTCCTCCCA CCTTAGCTTC TCAAAGTGTT GAGATCACAG GCGTGAG CCA CTGCACCCGG 10 80 

CCCCTACTCC TTTTTCTAAT AAGCTGTATC TGTAATCACA GCATTCCTAC AGTTGTTACA 1140 

GTGTGTTTTT TAAATGAAAG TAAACATGGT TACATTTGAA TCTCTTAAAT AAGCAGTCAC 1200 

75 TTGGCTGGAC AGGAAGAAGG TAGATCCTGT GTGTCTTGTT TTCTGGTCAT GTGTATTGTA 1260 

CAAGCTAGAG AGCTGAATTT CTGAGATACA CATTTTCAAA TCACATGCAA GTGAAGATGA 132 0 

TGGTCTGTAG AAATTTTCAG TATATATAAT GTTTAATGAC AT ACTAAT T T ATCATCTGGC 13 80 

TATTTGGGAA GGAAGGACAC ACATGGATTT TGCACATTTC CACCATGGTG GCTGGTGTGG 1440 

CTTGTGGCTA TGGGGTGATC ACCAGTATCA CCACTTTGGA AGGGGACAGT GAAATTGGGG 1500 

80 CTAGAGAAGG AACTTTGTAC AGTTTTCCCT GAGATTCAGA TTGACTGAAA AGTCACATGA 1560 

AGAGTTGATT GTCTTTTAAT GGTATGTTTT AAACAGCTGA CATTTTAAAT TTTGATGAAA 162 0 

TCCAGTTTAT TCGTTTGTTC TTTTATGCTT TGGGTGTTGC ATCCGAGAAA TCTTTTCCCA 168 0 

TCCCAAGATC ACAATTTTTT TTCCTTTTTA CTTCTAGAAG TGTTATAATT TTAAGCTTTA 1740 

TACTTTGGTC TATGACCCGT TTTTTTTTTT GTTTTGTTTT GTTTTTTCGT TTGTTTCTTT 180 0 

85 GTTTTGAGAT GGAGTCTTGT TCTGTCACCC AGGCTGGGGT GCAGTGGCGT GATCTTGGCT 1860 

CACTGCAATC TCTATCCCCT GGGTTCAAGT GATTCTCTTG TCTCAGCCTC CCAAGTAGCT 1920 

GGGATTACAG GCACAGGCCG CCACGCCTGG CTAATTTTTG TATTTTTAGT AGAGACAGAG 1980 
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80 



WO 02/086443 

TTTTACCATG TTGGCCAGGC 
CCCAAAGTTT TGGGATTACA 
GAATTTTTTA TATGGTGCAA 
TCCAGCTGTT TCACTACCAT 
TTTGTTAAAA AGTAGTTGTC 
ATTGACCTGT TTTTCTCTCC 
TCTAATAATT CTTGAAACAG 
TTTGTAGAGA TGGGGTTTCA 
ATACACTTGC CTCGTCCTCC 
CAGTGTACCA CATTTCTTTT 
GTGAAATTTG GGAACAGGCA 
GGCCTAGATG GGTGGATCAC 
AACTCCGTCT CTACAAAAAA 
CACAGTTACA CGGCAGGCTG 
GTGAGCTGAG ATCACACCAC 
AAAGAAATTA GGATCAATTT 
CACCTTGATT GAGATTGCAT 
AATATTGAGT CTTCTGGCCT 
TCTATTTCTC TTAATAATCT 
CATAGTTTTG ATGCTAAATG 
AATAGAAATA CAATTGATGT 
ATGGTGTTTT TGTAAATTAC 
TTC 



TGGTTTCAAA 
AGTGTGGGCC 
GGTGTCAATC 
TTTTTGAAAG 
AATGTATATG 
TGAATGCCAA 
ATAGTATTAA 
CCGTGTTGGC 
CCATGTGCTG 
TGAGATTTGT 
GGGTGTGGTG 
TTGAG CTCAG 
TAGAAAAAAT 
AGGTGGGAGG 
TGT ACT CC AG 
GTCAATTTCT 
TGAATTTATA 
ATAAACAAGG 
TTTGTAGTTT 
GTATTTTAAA 
TGAACTTGTA 
ATCAACAGTC 



CTCCTGACCT 
ACCGCGGCCA 
CACCTTCACT 
GACTGCCCTT 
TGGGTTTATT 
TACCATATTT 
TGTGT CAT AT 
CAGGCTGTGT 
GGATTACAGG 
TTTGGCTATG 
GCTTATGCCT 
GAGTTCCAGA 
TAGCCAGGTG 
AT CACTTGAA 
CCTGGGTGAC 
ACAACAACAA 
TAAAACTGTT 
TCTGTCTTCC 
TCAGTGTACA 
ATTTCAAATT 
TCCTTCAGCC 
ATGTGTTCTA 



CAAGTGACCC 
GCCTATGATC 
TTTTCTTGGG 
TGCTCTATCA 
TCAGGACTCT 
GTATGTAGTG 
TTTTGCTGTT 
TGAACTCCTG 
CGTGAGCCTT 
TTAAGTCCTT 
GTAATCCTAG 
CCAGCCCGGG 
TGGTGGTGCA 
CCCCAGAGGT 
AAAGTGAGAC 
CAACAAAAAC 
GGGAGAATTG 
TAGGTATTAA 
GGTCTACCAT 
CTAACCACTT 
TTGCTAAACT 
TGAATAAAGA 



ACCTTGGCCT 
CATTTTGAAT 
AATATAGATA 
CCTTTGCATT 
GTTTTGTTCC 
TATGTAATTT 
GTTTGTATTT 
AGCTAAAGCA 
GGTGCTGGCC 
TGCTTTTGAT 
AACTTTGGGA 
CCTATGGCAA 
TGCCTGTAGT 
CAAGACTGCA 
TCTATCTCAA 
CCCTGTTGGG 
ACATCTTAAT 
TGTTTTGTCT 
GTCAGCATTT 
GTTG CTAGTA 
GTGAGTTCTC 
GTTTTACTCC 



Seq ID NO: 154 Protein sequence: 
Protein Accession #: BAA11503.1 

1 11 21 31 41 51 

I I I i I I 

MFCEKAMELI RELHRAPEGQ LPAFNEDGLR QVLEEMKALY EQNQSDVNEA KSGGRSDLIP 

TIKFRHCSLL RNRRCTVAYL YDRLLRIRAL RWEYGSVLPN ALRFHMAAEE MEWFNNYKRS 

LATYMRSLGG DEGLDITQDM KPPKSLYIEV RCLKDYGEFE VDDGTSVLLK KNSQHFLPRW 

KCEQLIRQGV LEHILS 

Seq ID NO: 155 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 149-709 



85 



GTTCGGCGCC 
CGAAAGGAGT 
AAGGCCGCGG 
CGAGCTGCAT 
AGTTCTGGAG 
GTCAGGTGGA 
AAATCGACGC 
ATGGGAATAT 
GGAGTGGTTT 
TGAAGGTTTG 
ATGCAGTGGC 
CAACCTCCAC 
GCACTTCAGT 
AGCTGATCAG 
CAGGCTTCAC 
CCCTCTTTGA 
AAGTATAATT 
ACTCTTTTTT 
TCTCAAACTC 
AGGCGTGAGC 
CAGCATTCCT 
AATCTCTTAA 
TTTTCTGGTC 
AATCACATGC 
ACATACTAAT 
TCCACCATGG 
GAAGGGGACA 
GATTGACTGA 
GACATTTTAA 
GCATCCGAGA 
AGTGTTATAA 
TTGTTTTTTC 
GTGCAGTGGC 
TGTCTCAGCC 
TGTATTTTTA 
C T CAAGTG AC 
CAGCCTATGA 
CTTTTTCTTG 
TTTGCTCTAT 
TTTCAGGACT 
TTGTATGTAG 
ATTTTTGCTG 
GTTGAACTCC 
GGCGTGAGCC 
TGTTAAGTCC 
CTGTAATCCT 
GACCAGCCCG 



11 
I 

AAAGCGCGGA 
GAGGCGCCGA 
GAGTGGGAAG 
CGCGCGCCCG 
GAGATGAAAG 
CGAAGTGATT 
TGCACTGTAG 
GGTAGCGTCT 
AATAATTATA 
GACATTACAC 
GCGATCTCGG 
CTCCCAGGTC 
CCTATTAAAA 
ACAAGGAGTC 
TCAACTCATG 
TTTTAGAAGC 
TGCTAACTAT 
GGTTTTGGTT 
CTGGCCTCAA 
CACTGCACCC 
ACAGTTGTTA 
AT AAGCAGT C 
ATGTGTATTG 
AAGTGAAGAT 
TTATCATCTG 
TGGCTGGTGT 
GTGAAATTGG 
AAAGTCACAT 
ATTTTGATGA 
AATCTTTTCC 
TTTTAAGCTT 
GTTTGTTTCT 
GTGATCTTGG 
TCCCAAGTAG 
GTAGAGACAG 
CCACCTTGGC 
TCCATTTTGA 
GGAATATAGA 
CACCTTTGCA 
CTGTTTTGTT 
TGTATGTAAT 
TTGTTTGTAT 
TGAGCTAAAG 
TTGGTGCTGG 
TTTGCTTTTG 
AGAACTTTGG 
GGCCTATGGC 



21 
i 

GCGGAGGCCG 
GAGCCCAGAT 
CGTCCGCCAT 
AAGGGCAACT 
CTTTGTATGA 
TGATACCAAC 
CATACCTGTA 
TGCCAAATGC 
AAAGATCTCT 
AGGATATGAA 
CTCAACCTGC 
CGGTGTCTAA 
AAAAATAGCC 
CTGGAGCACA 
GACTCCTCTG 
TATAGACATT 
TAAGGACTTT 
TTGTTTTGTA 
GCAGTCCTCC 
GGCCCCTACT 
CAGTGTGTTT 
ACTTGG CTGG 
TACAAGCTAG 
GATGGTCTGT 
GCTATTTGGG 
GGCTTGTGGC 
GGCTAGAGAA 
GAAGAGTTGA 
AATCCAGTTT 
CATCCCAAGA 
TATACTTTGG 
TTGTTTTGAG 
CTCACTGCAA 
CTGGGAT TAC 
AGTTTTACCA 
CTCCCAAAGT 
ATGAATTTTT 
TATCCAGCTG 
TTTTTGTTAA 
CCATTGACCT 
TTTCTAATAA 
TTTTTGTAGA 
CAATACACTT 
CCCAGTGTAC 
ATGTGAAATT 
GAGGCCTAGA 
AAAACTCCGT 



31 
I 

AGGCGAGAGC 
ACCATTTTGG 
GTTCTGCGAA 
GCCTGCCTTC 
ACAAAACCAG 
TATCAAATTT 
TGACCGCTTG 
ATTACGATTT 
TGCTACTTAT 
ACCACCAAAA 
AACCTCCACC 
AAGACTATGG 
AGCACTTTTT 
TCCTGTCATG 
TACTCACTCT 
GTTTAAGATA 
CTTTTTTTAA 
GAGACTGTCT 
CACCTTAGCT 
CCTTTTTCTA 
TTTAAATGAA 
ACAGGAAGAA 
AGAGCTGAAT 
AGAAATTTTC 
AAGGAAGGAC 
TATGGGGTGA 
GGAACTTTGT 
TTGTCTTTTA 
ATTCGTTTGT 
TCACAATTTT 
TCTATGACCC 
ATGGAGTCTT 
TCTCTATCCC 
AGGCACAGGC 
TGTTGGCCAG 
TTTGGGATTA 
TATATGGTGC 
TTTCACTACC 
AAAGTAGTTG 
GTTTTTCTCT 
TTCTTGAAAC 
GATGGGGTTT 
GCCTCGTCCT 
CACATTTCTT 
TGGGAACAGG 
TGGGTGGATC 
CTCTACAAAA 



41 
1 

CTGGCGCTGT 
CGTGAGAGCT 
AAAGCCATGG 
AACGAGGATG 
TCTGATGTGA 
CGACACTGTT 
CTTCGGATCA 
CACATGGCTG 
ATGAGGTCAC 
AGCCTATATA 
TCCCAGGTTC 
AGAATTTGAA 
ACCTCGATGG 
ACCATGCGCC 
CTCCACCACT 
ACTAAGAATA 
TGTTGTACAC 
CACTATGTTG 
TCTCAAAGTG 
ATAAGCTGTA 
AGTAAACATG 
GGTAGATCCT 
TTCTGAGATA 
AGTATATATA 
ACACATGGAT 
TCACCAGTAT 
ACAGTTTTCC 
ATGGTATGTT 
TCTTTTATGC 
TTTTCCTTTT 
GTTTTTTTTT 
GTTCTGTCAC 
CTGGGTTCAA 
CGCCACGCCT 
GCTGGTTTCA 
CAAGTGTGGG 
AAGGTGTCAA 
ATTTTTTGAA 
TCAATGTATA 
CCTGAATGCC 
AGATAGTATT 
CACCGTGTTG 
CCCCATGTGC 
TTTGAGATTT 
CAGGGTGTGG 
ACTTGAGCTC 
AATAGAAAAA 



51 
I 

AGGACTAGAA 
GGTGGTTGGC 
AACTGATCCG 
GACTCAGACA 
ATGAAGCAAA 
CTCTGTTAAG 
GAGCACT CAG 
CTGAAGAAAT 
TGGGAGGAGA 
TTGAAGCTGG 
ACCTCAACTG 
GTTGATGATG 
AAATGTGAGC 
GAGGCACTTC 
CCCTTCACCT 
CTTGGCTAAG 
TATTCTTCCT 
CCCAAGCTGG 
TTGAGAT CAC 
TCTGTAATCA 
GTTACATTTG 
GTGTGTCTTG 
CACATTTTCA 
ATGTTTAATG 
TTTGCACATT 
CACCACTTTG 
CTGAGATTCA 
TTAAACAGCT 
TTTGGGTGTT 
TACTTCTAGA 
TTGTTTTGTT 
CCAGGCTGGG 
GTGATTCTCT 
GGCTAATTTT 
AACTCCTGAC 
CCACCGCGGC 
TCCACCTTCA 
AGGACTGCCC 
TGTGGGTTTA 
AATACCATAT 
AATGTGTCAT 
GCCAGGCTGT 
TGGGATTACA 
GTTTTGGCTA 
TGGCTTATGC 
AGGAGTTCCA 
ATTAGCCAGG 
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60 
120 
180 
240 
300 
360 
42 0 
480 
540 
600 
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780 
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900 
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1020 
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1140 
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2400 
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2520 
2580 
2640 
2700 
2760 
2820 



245 



10 



WO 02/086443 

TGTGGTGGTG CATGCCTGTA 
AACCCCAGAG GTCAAGACTG 
ACAAAGTGAG ACTCTATCTC 
AACAACAAAA ACCCCTGTTG 
TTGGGAGAAT TGACATCTTA 
CCTAGGTATT AATGTTTTGT 
CAGGTCTACC ATGTCAGCAT 
TTCTAACCAC TTGTTGCTAG 
CCTTGCTAAA CTGTGAGTTC 
TATGAATAAA GAGTTTTACT 



GTCACAGTTA 
CAGTGAGCTG 
AAAAAGAAAT 
GGCACCTTGA 
ATAATATTGA 
CTTCTATTTC 
TTCATAGTTT 
TAAATAGAAA 
TCATGGTGTT 
CCTTC 



CACGGCAGGC 
AGATCACACC 
TAGGATCAAT 
TTGAGATTGC 
GTCTTCTGGC 
TCTTAATAAT 
TGATGCTAAA 
TACAATTGAT 
TTTGTAAATT 



TGAGGTGGGA 
ACTGTACTCC 
TTGTCAATTT 
ATTGAATTTA 
CTATAAACAA 
CTTTTGTAGT 
TGGTATTTTA 
GTTGAACTTG 
ACATCAACAG 



GGATCACTTG 2880 

AGCCTGGGTG 2 940 

CTACAACAAC 3000 

TATAAAACTG 3060 

GGTCTGTCTT 3120 

TTTCAGTGTA 318 0 

AAATTTCAAA 3240 

TATCCTTCAG 33 00 

TCATGTGTTC 3360 
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Seq ID NO: 156 Protein sequence: 
Protein Accession #: Eos sequence 

1 11 21 31 41 51 

I I 1 I I I 

MFCEKAMELI RELHRAPEGQ LPAFNEDGLR QVLEEMKALY EQNQSDVNEA KSGGRSDLIP 
TIKFRHCSLL RNRRCTVAYL YDRLLRIRAL RWEYGSVLPN ALRFHMAAEE MEWFNNYKRS 
LATYMRSLGG DEGLDITQDM KPPKSLYIEA GCSGAISAQP ATSTSQVHLN CNLHLPGPVS 
KRLWRI 

Seq ID NO: 157 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 148-621 



I 



11 



21 



31 



41 



51 



I 



80 



TTCGGCGCCA 
GAAAGGAGTG 
AGGCCGCGGG 
GAGCTGCATC 
GTTCTGGAGG 
TCAGGTGGAC 
AATCGACGCT 
TGGGAATATG 
CGGTGT CTAA 
AAAAAT AG CC 
CTGGAGCACA 
GACTCCTCTG 
TATAGACATT 
TAAGGACTTT 
TTGTTTTGTA 
GCAGTCCTCC 
GGCCCCTACT 
CAGTGTGTTT 
ACTTGGCTGG 
TACAAGCTAG 
GATGGT CTGT 
GCTATTTGGG 
GGCTTGTGGC 
GGCTAGAGAA 
GAAGAGT TG A 
AAT CCAGTTT 
CATCCCAAGA 
TATACTTTGG 
TTGTTTTGAG 
CTCACTGCAA 
CTGGGATTAC 
AGTTTTACCA 
CTCCCAAAGT 
ATGAATTTTT 
TATCCAGCTG 
TTTTTGTTAA 
CCATTGACCT 
TTTCTAATAA 
TTTTTGTAGA 
CAATACACTT 
CCCAGTGTAC 
ATGTGAAATT 
GAGGCCTAGA 
AAAACTCCGT 
GTCACAGTTA 
CAGTGAGCTG 
AAAAAGAAAT 
GGCACCTTGA 
ATAATATTGA 
CTTCTATTTC 
TTCATAGTTT 
TAAATAGAAA 
TCATGGTGTT 
CCTTC 



AAGCGCGGAG 
AGGCGCCGAG 
AGTGGGAAGC 
GCGCGCCCGA 
AGATGAAAGC 
GAAGTGATTT 
GCACTGTAGC 
GTAGCGTCTT 
AAGACTATGG 
AGCACTTTTT 
TCCTGT CATG 
T ACT CACT CT 
GTTTAAGATA 
CTTTTTTTAA 
GAGACTGTCT 
CACCTTAGCT 
CCTTTTTCTA 
TTTAAATGAA 
ACAGGAAGAA 
AGAGCTGAAT 
AGAAATTTTC 
AAGGAAGGAC 
TATGGGGTGA 
GGAACTTTGT 
TTGTCTTTTA 
ATTCGTTTGT 
TCACAATTTT 
TCTATGACCC 
ATGGAGTCTT 
TCTCTATCCC 
AGGCACAGGC 
TGTTGGCCAG 
TTTGGGATTA 
TATATGGTGC 
TTTCACTACC 
AAAGTAGTTG 
GTTTTTCTCT 
TTCTTGAAAC 
GATGGGGTTT 
GCCTCGTCCT 
CACATTTCTT 
TGGGAACAGG 
TGGGTGGATC 
CTCTACAAAA 
CACGGCAGGC 
AGATCACACC 
TAGGATCAAT 
TTGAGATTGC 
GTCTTCTGGC 
TCTTAATAAT 
TGATGCTAAA 
TACAATTGAT 
TTTGTAAATT 



CGGAGGCCGA 
AGCCCAGATA 
GTCCGCCATG 
AGGGCAACTG 
TTTGTATGAA 
GATACCAACT 
ATACCTGTAT 
GCCAAATGCA 
AGAATTTGAA 
ACCTCGATGG 
ACCATGCGCC 
CTCCACCACT 
ACTAAGAATA 
TGTTGTACAC 
CACTATGTTG 
TCTCAAAGTG 
ATAAGCTGTA 
AGTAAACATG 
GGTAGATCCT 
TTCTGAGATA 
AGTATATATA 
ACACATGGAT 
TCACCAGTAT 
ACAGTTTTCC 
ATGGTATGTT 
TCTTTTATGC 
TTTTCCTTTT 
GTTTTTTTTT 
GTTCTGTCAC 
CTGGGTTCAA 
CGCCACGCCT 
GCTGGTTTCA 
CAAGTGTGGG 
AAGGTGTCAA 
ATTTTTTGAA 
TCAATGTATA 
CCTGAATGCC 
AGATAGTATT 
CACCGTGTTG 
CCCCATGTGC 
TTTGAGATTT 
CAGGGTGTGG 
ACTTGAGCTC 
AATAGAAAAA 
TGAGGTGGGA 
ACTGTACTCC 
TTGTCAATTT 
ATTGAATTTA 
CTATAAACAA 
CTTTTGTAGT 
TGGTATTTTA 
GTTGAACTTG 
ACATCAACAG 



GGCGAGAGCC 
CCATTTTGGC 
TTCTGCGAAA 
CCTGCCTTCA 
CAAAACCAGT 
ATCAAATTTC 
GACCGCTTGC 
TTACGATTTC 
GTTGATGATG 
AAATGTGAGC 
GAGGCACTTC 
CCCTTCACCT 
CTTGGCTAAG 
TATTCTTCCT 
CCCAAGCTGG 
TTGAGATCAC 
T CTGT AAT C A 
GTTACATTTG 
GTGTGTCTTG 
CACATTTTCA 
ATGTTTAATG 
TTTGCACATT 
CACCACTTTG 
CTGAGATTCA 
TTAAACAGCT 
TTTGGGTGTT 
TACTTCTAGA 
TTGTTTTGTT 
CCAGGCTGGG 
GTGATTCTCT 
GGCTAATTTT 
AACTCCTGAC 
CCACCGCGGC 
TCCACCTTCA 
AGGACTGCCC 
TGTGGGTTTA 
AATACCATAT 
AATGTGTCAT 
GCCAGGCTGT 
TGGGATTACA 
GTTTTGGCTA 
TGGCTTATGC 
AGGAGTTCCA 
ATTAGCCAGG 
GGATCACTTG 
AGCCTGGGTG 
CTACAACAAC 
TATAAAACTG 
GGTCTGTCTT 
TTTCAGTGTA 
AAATTTCAAA 
TATCCTTCAG 
TCATGTGTTC 



TGGCGCTGTA 
GTGAGAGCTG 
AAGCCATGGA 
ACGAGGATGG 
CTGATGTGAA 
GACACTGTTC 
TTCGGATCAG 
ACATGGCTGC 
GCACTTCAGT 
AGCTGAT CAG 
CAGGCTTCAC 
CCCTCTTTGA 
AAGTATAATT 
ACTCTTTTTT 
TCTCAAACTC 
AGGCGTGAGC 
CAGCATTCCT 
AATCTCTTAA 
TTTTCTGGTC 
AAT CACATGC 
ACATACTAAT 
TCCACCATGG 
GAAGGGGACA 
GATTGACTGA 
GACATTTTAA 
GCATCCGAGA 
AGTGTTATAA 
TTGTTTTTTC 
GTGCAGTGGC 
TGTCTCAGCC 
TGTATTTTTA 
CT CAAGTGAC 
CAGCCTATGA 
CTTTTTCTTG 
TTTGCTCTAT 
TTTCAGGACT 
TTGTATGTAG 
ATTTTTGCTG 
GTTGAACTCC 
GGCGTGAGCC 
TGTTAAGTCC 
CTGTAATCCT 
GACCAGCCCG 
TGTGGTGGTG 
AACCCCAGAG 
ACAAAGTGAG 
AACAACAAAA 
TTGGGAGAAT 
CCTAGGTATT 
CAGGTCTACC 
TTCTAACCAC 
CCTTGCTAAA 
TATGAATAAA 



GGACTAGAAC 1 

GTGGTTGGCA 

ACTGATCCGC 

ACTCAGACAA 

TGAAGCAAAG 

TCTGTTAAGA 

AGCACTCAGA 

TGAAGAAGTC 

CCTATTAAAA 

ACAAGGAGTC 

TCAACTCATG 

TTTTAGAAGC 

TGCTAACTAT 

GGTTTTGGTT 

CTGGCCTCAA 

CACTGCACCC 

ACAGTTGTTA 

ATAAGCAGTC 

ATGTGTATTG 

AAGTGAAGAT 

TTATCATCTG 

TGGCTGGTGT 

GTGAAATTGG 

AAAGTCACAT 

ATTTTGATGA 

AATCTTTTCC 

TTTTAAGCTT 

GTTTGTTT CT 

GTGATCTTGG 

TCCCAAGTAG 

GTAGAGACAG 

CCACCTTGGC 

TCCATTTTGA 

GGAATATAGA 

CACCTTTGCA 

CTGTTTTGTT 

TGTATGTAAT 

TTGTTTGTAT 

TGAGCTAAAG 

TTGGTGCTGG 

TTTGCTTTTG 

AGAACTTTGG 

GGCCTATGGC 

CATGCCTGTA 

GTCAAGACTG 

ACTCTATCTC 

ACCCCTGTTG 

TGACATCTTA 

AATGTTTTGT 

ATGTCAGCAT 

TTGTTGCTAG 

CTGTGAGTTC 

GAGTTTTACT 



60 
120 
180 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
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Seq ID NO: 158 Protein sequence: 
Protein Accession #: Eos sequence 



11 



21 



31 



41 



51 



246 



10 



15 



20 



25 



WO 02/086443 

MFCEKAMELI RELHRAPEGQ LPAFNEDGLR QVLEEMKALY EQNQSDVNEA KSGGRSDLIP 
TIKFRHCSLL RNRRCTVAYL YDRLLRIRAL RWEYGSVLPN ALRFHMAAEE VRCLKDYGEF 
EVDDGTSVLL KKNSQHFLPR WKCEQLIRQG VLEHILS 

Seq ID NO: 159 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 149-229 



PCT/US02/12476 



i 
1 

GTTCGGCGCC 
CGAAAGGAGT 
AAGGCCGCGG 
CGAGCTGCAT 
GGCACACACC 
GGAAGTTGAA 
TGAATCCCTG 
AAGCTTTGTA 
GTAGCATACC 



11 
I 

AAAG CGCGGA 
GAGGCGCCGA 
GAGTGGGAAG 
CGCGCGCCCG 
TGTAGTCCCA 
ACTGCAGTGA 
TCTCAAAAAG 
TGAACAAAAC 
TGTATGACCG 



21 

I 

GCGGAGGCCG 
GAGCCCAGAT 
CGTCCGCCAT 
AAGGGCAACT 
GCAACTTAGG 
ACTGTGGTCA 
GAAAAGGAGG 
CAGTCTGATG 
CTTGCTTCGG 



31 
I 

AGG CGAGAGC 
ACCATTTTGG 
GTTCTGCGAA 
GCCTGCCTTC 
AGGCTGAAGT 
CGCTATTACA 
ATGGACT CAG 
TGTTCTCTGT 
ATCAGAGCAC 



41 
I 

CTGGCGCTGT 
CGTGAGAGCT 
AAAGCCATGG 
AACAATTAGC 
GAGAGGATTG 
CTCCAGCCTG 
ACAAGTTCTG 
TAAGAAAT CG 
TCAGATGG 



51 
I 

AGGACTAGAA 
GGTGGTTGGC 
AACTGATCCG 
TGGGTGTGGT 
CATGGCTCCA 
GGTGACAGAC 
GAGGAGATGA 
ACGCTGCACT 



Seq ID NO: 160 Protein sequence: 
Protein Accession #: Eos sequence 



11 



31 



41 



51 



21 

I I I I I I 

ATGTTCTGCG AAAAAGCCAT GGAACTGATC CGCGAGCTGC ATCGCGCGCC CGAAGGGCAA 
CTGCCTGCCT TCAACAATTA G 



60 
120 



60 
120 
180 
240 
300 
360 
420 
480 
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Seq ID NO: 161 DNA sequence 
Nucleic Acid Accession #: U10694 
Coding sequence: 1333-2280 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



GGAT CCGGCC 
ACAGGGAGGC 
AGGAACCTAA 
TTTGCCCTGC 
CCTTTATCCT 
CACGTCAGCA 
CCCACTCACC 
CCGCTGGGTG 
AGGTCAACAG 
CTCACCCCAG 
AACCCTGGGC 
ATGTGAGCTC 
CAGGAGAAAG 
AGAACTCAAG 
CAGTCTGCAG 
CTTGGTCTGA 
TGAAGGTGAA 
GGACCCCATA 
AGGCTAGCTG 
ACCAGGAGGA 
GCCTTTGTTA 
TCCCCAGGCC 
ACCAGAGTCA 
GAAGCCCAAG 
GAGACTACCT 
CCTCCCCAGA 
AGCCAATTCG 
CCAGCTCAGC 
CATTTCCTGC 
AGCGTCATCA 
ATGCAGGTGA 
CTTGTCACTG 
AAGGCCGCCC 
GAAGAGGTTA 
TTCTACGGGG 
TACCGGCAGG 
CACGCTGAAA 
CCCATCTGCT 
GCACCAGCCG 
GCCCCATGTG 
CAGTGGCAGT 
GTGATTTGGA 
AGTTTAATGA 
ATGTTATTTA 
TGAATTGGGA 
CAGCAAAATA 
ACCTCTTTCT 
TCTTTGAGCA 
TTTTTTCTTC 



11 
I 

GGAT CTC AGG 
CCTGTGTTCG 
GGGAGGAT CG 
CCCTACTGTC 
GGGATCACTG 
GAGGGAGGGT 
AAACACAGAG 
G ATGGACT CC 
AGGGAGGGTT 
GACACATGGA 
AGGTGTGGGC 
CTGATCTGAG 
GTCAGGGCCC 
AGTGTCCAGC 
CCTAAGGGCC 
GACAGTGTCC 
GTGTTCACCC 
GCACCTGGCC 
CACGCTGAGT 
CAGGAGCCCC 
GAACCTCCAA 
TGTGGGTCTC 
TCATGTCTCT 
GAGAGGACTT 
CCTCCTCTGA 
GTCCTCAGGG 
ATGAGGGCTC 
TGGAGTTCAT 
TCCACAAATA 
AAAATTACAA 
TCTTTGGCAC 
CTCTTGGCCT 
T CCTGAT CAT 
TCTGGGAAGC 
AGCCCAGGAA 
TGCCCGGCAG 
CCAGCTATGA 
ACCCATCCCT 
CAGCCGGGGC 
ACATGAGGCC 
GGGTGGAAGT 
GATTTATCCT 
ACTTCACCAT 
GGAGTAAGAT 
CAAGATAACA 
GAGCTCATAA 
CTCTCCTGTA 
TGTAAGAGAA 
AGACACGCAC 



21 
I 

GAGGTGAGGA 
ACAGACACAG 
AGGGTACCTC 
ACCCCAGAGA 
GTGTCGGGGA 
CCCAGGCCCT 
GACCTAGCCC 
CCTCACTTCC 
CCAGACCCTG 
CCCCATTGAA 
AGATGTTGGT 
AGACTCTCAG 
TGAGTGAGCG 
CCGCCCTCTT 
CCTCGATTCC 
TCAGGTCGCA 
TGAATGTGCA 
CCATTCCCCC 
AGCCCTCTCA 
AAGAGGCCCC 
GGTTCGGTTC 
CATCGCCCAG 
CGAGCAGAGG 
GGGCCTGATG 
CAGCAAGGAG 
AGGCGCTTCC 
CAGCAGTCAA 
GTTCCAAGAA 
TCGAGTCAAG 
GCGCTACTTT 
TGATGTGAAG 
CTCGTGCGAT 
TGTCCTGGGT 
GTTGAGTGTG 
GCTGCTCACC 
TGAT CCTGCG 
GAAGGTCATA 
TTATGAAGAG 
CAAAGTTTGT 
CATTCTTCGC 
GAGCACACTG 
TGCTCCCTTT 
CGAAGTTAAT 
TCTTGCTTTT 
TAGCAGAGGA 
AGAAATAGTG 
AAATTAAAAC 
ATAAAAATTG 
TGAACATCTG 



31 
I 

CTTTGTTCTC 
TGGTCCCAGG 
CAGGCCAGAG 
GCCCGGGCAG 
GGGCTGGCCT 
GCCAGGAGTC 
CACCCTGCCC 
TCTTCAGGTG 
CAGGCATCAA 
TTTAGACATC 
TGGGGCATGT 
GCAAGTAGAG 
CAGAGGGGAC 
GACAGCACTG 
TCTTCCAGGA 
GAGCAGAGGA 
CCAAGGGCCC 
TACTGTCACT 
CTTCCTCCCT 
AGAGCAGCAC 
TCAGCTGAAG 
CTCCTGCCCA 
AGTCCGCACT 
GGTGCACAGG 
GAGGAGGTGT 
TCCTCCATTT 
GAAGAGGAAG 
GCACTGAAAT 
GAGCCGGTCA 
CCTGTGATCT 
GAGGTGGACC 
AGCATGCTGG 
GTGATCCTAA 
ATGGGGGTGT 
CAAGATTGGG 
CACTACGAGT 
AATTATTTGG 
GTTTTGGGAG 
GGGGTCAGGG 
TCTGTGTTTG 
TATGTCATCT 
TGGAATTGTT 
GAATGACAGT 
GAGTCACATG 
ATTAATAATT 
AAATGAAAAT 
ATATACATGT 
AAAGAATAAT 
TTATTCGGAA 



41 
I 

AGAGGGTGTG 
ATTGGAGAGC 
AAACTCTCAG 
GGCTGTCTGC 
TGGT CTGAGG 
CAGGTGCAGA 
CTTGTGTCAG 
TCTCCTGGAG 
GATGAGGACC 
TCTTACTGTA 
CCTTCTGTTC 
GAGTAGAGTC 
CATCCACCCC 
AGGGACCGGG 
GCTCCAGGAA 
GACCCAGGCA 
CACCTGCCCC 
CATAGAGCCT 
CAGGTTCTCG 
TGACGAAGAC 
TCTCTCACAC 
CGCTCCTGAC 
GCAAGCCTGA 
AACCCACAGG 
CTGCTGCTGG 
CCGTCTACTA 
AGCCAAGCTC 
TGAAGGTGGC 
CAAAGGCAGA 
TCGGCAAAGC 
CCGCCGGCCA 
GTGATGGTCA 
CCAAAGACAA 
ATGTTGGGAA 
TGCAGGAAAA 
TCCTGTGGGG 
TCATGCTCAA 
AGGAGCAAGA 
CCCCATCCAG 
AAGAGAGCAA 
CTGGGTTCCT 
CAAATGT T CT 
AGT CACACAT 
GGGAAATCCC 
TTTTTGAAAC 
GTAGTTAATT 
ATACCTGGAT 
TTTTCCTGTT 
CACCCTGGGT 



51 



TGTGGACAAA 60 

AGTCCAGGTG 12 0 

AT C AAG AG AG 180 

TGAGGTCCCT 240 

GGGCTGCACT 3 00 

CTGAGGGGAC 3 60 

CTGAGGGAAG 420 

ATAGGGCCTC 480 

AGGCAGTATC 54 0 

CTTCCGAGGA 600 

CAT AT CAGGG 660 

CAGTCCCTGC 72 0 

AAAAGTGTGT 78 0 

GCTCTGCCTG 840 

GCAGGCAGGC 900 

GTGT CAGCAG 960 

AG CACACATG 102 0 

TGATCTCTGC 10 80 

GGACAGGCTA 1140 

GTGTAAGTCA 12 0 0 

ACTCCCTCTC 12 60 

TGCTGCCCTG 132 0 

TGAAGACCTT 13 80 

CG AGGAGG AG 1440 

GTCAT CAAGT 150 0 

CACTTTATGG 1560 

CTCGGTCGAC 162 0 

TGAGTTGGTT 1680 

AATGCTGGAG 1740 

CTCCGAGTTC 1800 

CTCCTACATC 1860 

TAGCATGCCC 1920 

CTGCGCCCCT 1980 

GGAGCACATG 2040 

CTACCTGGAG 2100 

TTCCAAGGCC 2160 

TG CAAG AG AG 2220 

GGGAGTCTGA 22 80 

CAGCTGCCCT 2340 

TCAGTGTTCT 2400 

TGTCTATTGG 2460 

TTTAATGGTC 252 0 

ATTGCTGTTT 2580 

TGTTATTTTG 2640 

TTGAACTTAG 2700 

CTTGCCTTAT 2 760 

TTGCTTGGCT 2820 

CACTGGCTCA 2880 
T 



85 



Seq ID NO: 162 Protein sequence: 
Protein Accession #: AAA68877.1 



247 



WO 02/086443 



PCT/US02/12476 



10 



15 



20 
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30 



35 



40 



45 



50 



55 



60 



65 



70 



1 


11 


21 


31 


A 1 

41 


51 
1 




1 

MSLEQRSPHC 


1 

KPDEDLEAQG 


1 

EDLGLMGAQE 


1 

PTGEEEETTS 


1 

SSDSKEEEVS 


AAGSSSPPQS 


60 


PQGGASSSIS 


VYYTLWSQFD 


EGSSSQEEEE 


PSSSVDPAQL 


EFMFQEALKL 


KVAELVHFLL. 


120 


HKYRVKEPVT 


KAEMLESVIK 


NYKRYFPVIF 


GKASEFMQVI 


FGTDVKEVDP 


AGHSYILVTA 


180 


LGLSCDSMLG 


DGHSMPKAAL 


LIIVLGVILT 


KDNCAPEEVI 


WEALSVMGVY 


VGKEHMFYGE 


240 


PRKLLTQDWV 


QENYLEYRQV 


PGSDPAHYEF 


LWGSKAHAET 


SYEKVINYLV 


MLNAREPICY 


300 


PSLYEEVLGE 


EQEGV 













Seq ID NO: 163 DNA sequence 
Nucleic Acid Accession #: AF292100 
Coding sequence: 30-80 9 



75 



GGGGGGGGAG 
AAGTT CGTCA 
CTCAAAATGA 
ATATACGAGA 
GATACAAAGA 
ATGACCTGGC 
CAGCAACACA 
GTGACAGCAT 
CAGGACGATT 
AAGGATTAGA 
AATTCTTAGA 
ACACTTGGAA 
ATGAAGAAGG 
TTGCTGGGAC 
CTGTACAATA 
AGATCAATCC 
CCATATCGTA 
TAAACATTTA 
ATTCTCCCAT 
AAGCACAATG 
CAAAACAATT 
AATAGCACTT 
TTTGGGGGGA 
ATGAAAAAAC 
CTGAAAAATG 
GCTTACCTTA 
CTGCATAATG 
TGCTTTTGAA 
TTTTGGATTG 
TTTTACTTTT 
AAGATAGTAG 
AATATAGGTA 
AATTACTTTA 
C AAACAAG C A 
TCACTCAGAT 
GTGTGTGTGT 
T T* T T T T T T T 
ATTTCCCTGT 
TAAGGCAGGC 
TAGATTCTGC 
AGGAATGTAC 
ATGACATATC 
G AC AT AT TAA 
TTTGAAAATT 
ATCTTGCTGC 
GAAAAATTTT 
TGTCTTGAAG 
GTTTTCTTTA 
TTTTAAATGC 
TATAATTACT 
T AAAAGT TAA 
CTGAAAAGAG 
AGGGAATATT 
CTGTGAGAGA 
CCCCTTGAAT 
TGATTCTTTG 
GGTACAAATT 
C A CAT AT AAA 
GTAAGTTCAA 
GCAGTGAAAT 



11 
I 

AGGCCTGGAG 
GTTTATGATC 
CTGGAAGTTA 
GAGTGTAAAA 
CCCTCAAGAT 
ACTCGATCCA 
GTGCGAGTTC 
AGAACAACTA 
TAAGGATTTT 
TCTAGAAATG 
CTTATGGAAT 
TCTTCTTTTA 
AGCATGGCCT 
AAAAAGTACA 
AATACAACAG 
TCACAATTCA 
TTTCATTCTT 
TAATT CCAAC 
AAGTCTTAGA 
CTGTCTTCAT 
TATAAAAACT 
CCAGTGAGAG 
ATTTTTTTTT 
AATGTCAGAA 
TATTGTGTTT 
CCCATGTTTA 
TTAGATTCTT 
ATGCTTATCT 
CTACACAATA 
TTTTTGTCAT 
GAGTTAAATT 
CTGCTCTTTC 
ACTGCTAATC 
TACACGATGC 
TAGCTCAGTT 
GTGTGTGTGT 
TTTTTTTTAA 
TCACTTACTG 
TAGAAATGTA 
TTGGGATATA 
TTAGAATAGC 
AAAACTGCTT 
T ATT CCAAT C 
TCTATTCAGG 
TTTCAGTATT 
TAAAAGATAT 
ATTTTGAGTT 
AAAGT CAT AT 
AAAACCTTTT 
GTGTAATTAT 
GGTTGTTCAC 
AAGACTGATT 
TTGTACTAAA 
GCCAGAGAGA 
TGCTTTAACT 
TTTTAAACTG 
TTAAAATGTA 
AAATACTTGA 
TTGTGTTTCT 
TG 



21 
I 

GACACCAACA 
TTCACACAAT 
GATGTTGCAA 
GGATCATTGG 
GAGAATAAAA 
GCCAGCATTA 
TCCAAACAGG 
AAGGCCCAGA 
TACCAGTTTA 
GCCATTGCCT 
AAATTTTTGT 
GACTTCAGTA 
GTTCTTATTG 
ACAGTGTAGC 
AAAATTGCAC 
GACTGAGGGT 
CTAATGGTGG 
ATTGTGGATT 
AGCTTTATGG 
CAGAAAACAG 
TCTTAAATAT 
TGATATATTT 
TTTCCTGGCA 
TAACCGACAT 
TAGACTCTTG 
TATATAGCTG 
CTCCTGTCTA 
GCCTGTCACA 
CAATATTCTA 
TGCACTATGG 
TTGAAAATGG 
AGACAAACAG 
ACTGTGGTTG 
AAAATACCAG 
TTCTCATCAA 
GTATGTGTGT 
ATTACAAAAG 
ACATGTGAAG 
ATACTT CAAA 
TAT CCAGGCA 
AGTACATTTT 
TTTACATGAT 
ATAACTTTAA 
CTACTGGAAT 
TCCTGATTTT 
ATATATCTAT 
ATGGTTATTG 
GGGTT CGTGG 
CAACAAAATA 
AAACAAAAAT 
TATGATGGCA 
TAATGTGGTG 
AAATGATTAC 
GTGAGAGAGA 
CCTAAGTGTT 
AACCATAGGT 
ATGCTTTTTA 
GATGAAGATT 
TACAGTCCCT 



31 
I 

TGAACAAGTT 
CTAGTGAAAA 
CAGATAATTT 
ACAGGAAGAA 
TTGGAATAGA 
GTGTGTTGAT 
AGTTCATGGA 
TACCCAAGAT 
CTTTTAATTT 
ACTGGAACTT 
TGGAACATCA 
CGATGATTGC 
ATGACTTTGT 
ACTAAAGGAA 
AGTCAATTTC 
TGAGACAAAA 
TTTGGGCTTG 
TCATCTTATA 
TGATTATTTT 
TTGGCATAAG 
ACGCTTTGGG 
AAGTGTACTG 
AATCACATAT 
GAAAATTTTT 
ATTTCAAAAG 
TCCTACAGGG 
CATTATGCAC 
TAAGTTAAAC 
AATTTAGGCA 
AACACAAATG 
TTGTGATGAG 
TCCATTTTTA 
CCAAATATTT 
TCTGGCTTCT 
AGCAGAATGC 
ATATATATAT 
CCATGAGCTG 
AAGGGTTTCT 
TGTTTGATGA 
CTCTCTAAGG 
ATGCAAATAT 
TTTGAAATAG 
TTCAAGAATG 
TGGTTATTAA 
TTTGTAAATA 
ATATCTATAT 
GTTTCAGATT 
CCTAATGCCT 
GTGTTTGTCA 
ACATAAAGCT 
TCTTAGAATT 
TGATTATTCT 
ACATATGGCT 
TTGACAGAGA 
TCAGTCCTCA 
ACAGTTTCCT 
AATAGAAAAA 
ATCTTTAGTG 
GTCATATTAC 



41 



51 



GAAATCATCG 
AACAGCAGTA 
TTTCCAAAAT 
GTTAGAACAG 
TGGCATACAG 
TATTGCGTGG 
TGGCATGACA 
GGAACAAGAA 
TGCAAAGAAT 
AGTGCTTAAT 
TAAACGATCA 
AGATGACATG 
GGAATTTGCA 
CCTTTTAGAA 
TGCTGGCTGG 
CTTTAAGGAT 
TCTTCTAGTC 
TCTGTGGACC 
GAGGTTTTCA 
AATTAAACAT 
CTAGTTGCAA 
GATCTGGAAT 
GTTGTTGATG 
TAGGATAACT 
GTTCCACAGA 
AGCTTTTATT 
TACATAATTG 
TATTTAATTT 
TGAGGGTTTT 
AAATTCTCTT 
CCACGAAATT 
ATGACTTCTT 
ACTTCAGAAG 
AGTCTATTTA 
TATCTTGCGT 
ATATATATAT 
CTTTTATGCT 
TGCTTTCTTA 
TTATGGTCTT 
TCTAGGGTTG 
GGAAATTATT 
ACTAGAAAGC 
CAGTTTTACC 
AAGAAAAAGG 
TAAAGAGGAA 
ATATGTACTG 
GATTAATTCA 
TGGATTTTAC 
TCAGGTTGGT 
TTGAATATAA 
AAACAAAACT 
GAAGATAAAT 
GTGTGTGTTT 
AAGGGAGAGA 
TTCCGGTAAA 
TTTTGCCAAA 
TGTATAAAAT 
AATATCATCT 
CAACAGAGGC 



CAGAAGGATA 
AGTTGTCTTT 
CCTGAACTTT 
CTGTACAATA 
CAGTTCTGTG 
AAGTT CAG AG 
GAATTAGGAT 
TTGAAAGAAC 
CCAGGACAAA 
GGAAGATTTA 
ATACCAAAAG 
TCTAATTATG 
CGCCCTCAAA 
TGTACATAGT 
ACTGAACTGA 
ACATCTTGGA 
TGGGCCGCTC 
AT CCT AGTTT 
TTCTCGCATA 
ATGAACATCA 
AGACTATGCT 
GGTGTTTTGG 
TGAGTATCTG 
TGGTGCCTAC 
ACTAGTCTGC 
TAGAAAATGT 
GACTT CATT A 
GTTTTGAATG 
TTTGTTTTAT 
AATTTATAAG 
CAATCTTTAT 
ATTTTGTTGA 
CAAAGATTTT 
CTGTTTTGTT 
GTGTGTGTGT 
ATATATATTT 
GAAAATGGTC 
AACATTT CCG 
TTGATAGGAA 
ATATTAACAA 
TTAAGAAACA 
TTTCCCTATA 
AAAAGAAAAA 
AAAAAGAAGA 
CTTCAATTAT 
TTTTGTTTCC 
CATATGCTGT 
ATATTTTTCT 
ACTAAACATT 
TTATGTAGCA 
TTTACTAGGG 
GT CTGGCT AC 
GAGTCTGTGT 
CACACACACG 
CTCCCCATGC 
TGT CAAAACA 
TAGAAGTGCC 
GCATATCTCT 
AATAAAAGCT 
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85 



Seq ID NO: 164 Protein sequence: 
Protein Accession #: AAG00606 

1 11 21 31 41 51 

I I I I I l 

MNKLKSSQKD KVRQFMIFTQ SSEKTAVSCL SQNDWKLDVA TDNFFQNPEL YIRESVKGSL 60 

DRKKLEQLYN RYKDPQDENK IGIDGIQQFC DDLALDPAS I SVLIIAWKFR AATQCEFSKQ 12 0 

EFMDGMTELG CDSIEQLKAQ IPKMEQELKE PGRFKDFYQF TFNFAKNPGQ KGLDLEMAIA 180 

YWNLVLNGRF KFLDLWNKFL LEHHKRSIPK DTWNLLLDFS TMIADDMSNY DEEGAWPVLI 240 
DDFVEFARPQ IAGTKSTTV 



248 



WO 02/086443 
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Seq ID NO: 165 DNA sequence 
Nucleic Acid Accession #: AF256215 
Coding sequence: 220-2028 
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i 
I 

CTCCAGTCCG 
GCCTACGGGC 
CCTGCTCCAG 
CAGCCGCCGG 
GCGGCGGGAG 
CGCGTGAGTC 
TTTCCACGAA 
CAAGTTAAAA 
AAAATGAATA 
CGTAAACTGG 
GGCTTGACAA 
CTCAGACATT 
GGAAAAATTC 
TTGACTGGAC 
CAACTTTCTT 
CAAGTTCACA 
TTTTTCTGTC 
AACTCAAAGA 
AGCTGGCCTC 
AATTTTACCT 
GGAGAGATTA 
GTCTATGTAG 
ACTTCTTGTT 
GCAGTTCTAC 
GGCTCTTTTG 
CTGGAATATA 
TCATTTTTAC 
GTACCTGGAA 
AATGAAATTC 
ACAGGTTTAA 
TTTCCACCAA 
GTTGCTGTCC 
CTATGTGACA 
GGCCTGGGAG 
AACTCCAAAA 
TTAAGTACTG 
TTGCATCTTC 
TATTATAGAC 
TAAAATATTT 
TGCAGTTTTT 
GATTTATAAT 
ATTGAGGATA 
AGTGCAATTT 
AG CACAGAGC 
GATTTCTTGC 
GGATCTTGGG 
CCAGACGTGG 
CTTGAGGTCA 
AATACAAAAA 
TGACAGTCCA 
ACTGCTTGGG 
GCCGAGATCG 
AGTAAAAAAA 
TGACATTGGA 
GATTAAATGT 
TTTAAATGTT 
CACAGATTAA 
GCAATTACAG 
AAAT TATGAG 
GGAGAGCATT 
ATTATTTAAA 
TCAGTAGCTC 
ATGAAAGTCA 
AATCCAGTTT 
TCGCCAAAAC 
TTAGAACTTC 
TGTTTCCTTC 
CCTCTTGAAC 
TTGAGGACCT 
AATTGGTGTG 
GTGTTCTCTA 
CATTGCAGGT 
CAT CAT AGCT 
TTTGAGAGGC 
TCTTTGCAAG 
ACTCTGTGCA 
GTCCTGGACT 
GTTTCCTTCA 
CATATTTTTA 
TCGTGAGAAA 



11 
I 

CATGCTCAGT 
TGCGGTGGCG 
AGCCGCCGCC 
GCTGCGGAGC 
GTAAAGTGTT 
CAGGGACAAG 
AACGCAAAGG 
TGAAGGCCTT 
ACCTGATTGA 
ACAAACTTAC 
ATTCTTATGT 
TAATCCTTAA 
TCTTCGTTTC 
AAAGCTTATT 
CTTTTGATAT 
GTAATCTCCA 
GGATAAAGAG 
AGAAAGAGCA 
CAAATATTGT 
GCCTTGTGGC 
ATGTGAAACC 
ATCAAAGGGC 
ATGAATATTT 
AGAGTAAGGA 
TAACTTTAAA 
TTGTATCTGT 
CTTGTAGCTC 
TGTCTACTGG 
TGGATTTACA 
TGAAAGATAC 
GTCCTTCTGA 
ACAGCCATGA 
ATGATGACAC 
ACCCTGGGGA 
ATGAGAAACA 
TATTGATATT 
CTGTCACAGG 
TCCTTTATTC 
CTAACCAAGA 
TTTAGTTGAG 
AGTAGGTTTG 
GGGCTTACAC 
ATAGTCATAA 
TGGGATATTT 
TTAAAACTCA 
CCCTAGATCT 
TGCTCACGCC 
GGAGT T CAAG 
AAAT TACCCA 
TTCATGAGCG 
AGGCTGAGGC 
CACCACTGCA 
AAGATTTAAT 
AACATACTTA 
CTTGTGTAAA 
TAATGTATAT 
ATGATTAACT 
TTATTGCCTG 
GCAATGAGAA 
TTTAACAGTA 
ATACTGCATG 
TTCATAGCTT 
GATAGGCTGG 
CCTGTTCTAT 
AAAGCATTAT 
TGTCAGACAT 
AAGTGTGAAA 
TGATAGTGTC 
GAGAGACATC 
CAGCAGCCTA 
AATTG AG CAG 
TAGACTTGGC 
GGATGGCCTC 
AGAGT TTCTA 
AGGAGGGGCT 
TGGTTTGATC 
CAAAATCTAA 
AAATGTTTTA 
TGGTATACAC 
GAATATATCT 



21 
I 

AGCTGCTGCC 
GCCGCCGCGG 
TGGGCCGGGG 
CGACCAAGTG 
GAGAGAGGAG 
ACCAACAGCT 
AAGTGATTCA 
CAGAGAAGCT 
AGAACTGTCT 
AGTTTTAAGA 
GGGAAGTAAT 
GACTGCAGAA 
T AAGTCAGT C 
TGACTTCTTA 
TTCACCAAGA 
CGCTGGAAGG 
TTGTAAAATC 
CAGAAAATTC 
TGGAATGGAA 
CATTGGAAGA 
AACTGAATTT 
AACAG CGATT 
T CATC AAGAT 
GAAAATACTT 
AAGCCAATGG 
CAACACTTTA 
TCAATCATCA 
AACAGTACTT 
GAGGTTACAG 
TCATACTGTA 
AATGGGGGAG 
GCCACTCCTC 
AGCCATGGCT 
CTTCAGTGAC 
TTTTAAAGCA 
GTTTGTATCT 
GATGTGGGGA 
AGTGAAATGG 
ATACTACTTA 
GTAATGTAAT 
TATAATTTGG 
ACTTTAAGAA 
TCACATTGAA 
ATGCTCAGTT 
GAAAGTCAAA 
TGGGGATTAA 
TGTAATCCCA 
ACCAGCCTGG 
GGCACTCACT 
CAAAGGCCTC 
GAGAGGATTG 
CTCCAGTCTG 
ATAATCACTG 
GGGATAGATT 
GTCACACATT 
AAACCAGTTT 
AACTGACCCA 
TAACCAAAGG 
ATAATTTAAA 
ATTAATCCAG 
TCTACCTTCT 
GCCAAGTATG 
GAACTCATGG 
ATGGTGCTAC 
TTTGACCCTG 
GTTAATGACA 
TGTGCAGGGG 
CCAGCAATGT 
AGGTTTAGAA 
AGTGTTATAG 
AGGGGCCTGC 
TTCCAAAGAG 
AAAAGCAGAT 
GAGGGAGACC 
GTTCAATTCC 
CTTTATTAGT 
TCCATGCATT 
GTTTTCTTCA 
TATGTTCCTT 
ACAAATTGCA 



31 
I 

GGCCGGGCTG 
CACCCGGCAG 
CAGGGCGGGC 
GCTCCTGCGA 
AACCAGTGCA 
ATGGGGTCTT 
GACCCATCCC 
CATAGCCAAA 
GCAATGATCC 
ATGGCTGTTC 
TATAGACCAT 
GGCTTCTTAT 
TCCAAAATAC 
CATCCAAAAG 
GAAAAGCTAA 
ACACGTGTGT 
TCTGTCAAAG 
TATACTATCC 
GAAGAAAGGA 
TTACAGCCAT 
ATAACCCGGT 
TTAGGATATC 
GACCACAATA 
ACAGATTCCT 
TTTAGTTTCA 
GTTTTGGGAC 
GAAGAATCCT 
GGTGCTGGTA 
TCTTCTTCAT 
AACTGCAGGA 
CTAGAGGCTA 
AGTGATGGTG 
GCATTTATGA 
ATCCAGTGGA 
TTATTTACGA 
TTTATTAATG 
AATACGTTTT 
CTTATAATCC 
CATATTGTTT 
ATATTGATGT 
AACATTTTCC 
AACAGTGAGT 
TACTGTATTT 
GAGCACTTTA 
AGAGTTTCAG 
CCTCTGCATA 
GTACTTTGGG 
CCAATATGGT 
CTTGAGGTAA 
ATGACCTAAT 
CTTGAACCTG 
GGCAACAGAG 
AAGATCT CT A 
TGTCCTAAAG 
AAATTCAGTC 
CTTTATACAC 
GGAACTAGTT 
TAATAAAACA 
AACCAATTTT 
AGGTGGCTCA 
CGGGGATCAT 
CTCCCATATT 
GGCAGCCCTC 
ATCTTTCCAG 
CATGCTATTT 
AACATACCAA 
CTCGTGGGCA 
TGGAGGTTGG 
TGAGCCAAAG 
TTAAGTCTAA 
CTACCAATAT 
TCTGCCTAAG 
GGGGG CAGAC 
AGTGCTGCCT 
ATAGACCAGT 
TCGCTCTAAT 
GTATGATACC 
ACTAAATTTG 
TTTTCTACTG 
CGAAAGTATC 



41 

1 

CGGGGCGGCG 
GGCCCGCCAG 
CCGGGGCTCC 
TGGCGGCGGA 
TTGCTCCTGT 
TCAGCTCACA 
AAGTGGAAGA 
CTGAAAAGCG 
CTCAGTGCAA 
AACACTTGAG 
CATTTCTTCA 
TTGTGGTTGG 
TTAATTATGA 
ATGTTGCCAA 
TAGATGCCAA 
ATTCTGGCTC 
AAGAGCATGG 
ATTGCACTGG 
ACAGTAAGAA 
ATATTGTTCC 
TTGCAGTGAA 
TGCCTCAGGA 
ATTTGACTGA 
ACAAATTCAG 
CAAATCCTTG 
ATAGTGAGCC 
CTAGACAGTC 
GTATTGGAAC 
ACCTTGATGA 
GTATGTCAAA 
CCAGGCAAAA 
CACAGTTGGA 
ATTACTTAGA 
CCCTCTAGCC 
AAAAACTGTC 
TTCTACCACT 
CCTCCCAAGA 
ACTAGTTGCC 
TGGCTTTGTT 
TTTCCTTTGT 
ATGCCTTGCG 
ACTTGAACAT 
GATCTTTGGA 
AGATGAATTT 
CTTTCCTTAC 
TAAGATTTAC 
AGGCTGAGAC 
GAAACCCCGT 
CTAACCAACT 
GGCACACACC 
GGAGGCAGAG 
TGAGACTTCA 
TTATAGATAG 
GAAAAAAGTA 
ACACATTAAA 
ATTTGGGAAA 
GTAGCTTTCT 
AAATGACAAG 
CTAGTTATAA 
AATTGAGTAT 
ACTTTATAAC 
TTCTCTCTCG 
AGACTTCAAT 
AAAATTTCCC 
CTTTAGCTGT 
CAGACAATAA 
AGGATGTATT 
CACCATTCCT 
AAATCCTACA 
AGAAGTATGA 
CACTTTTTAG 
CCAGGGGTGG 
TTGCCCTCGT 
CTCACAGTGG 
GGGCAGATAG 
ATTTTTCTGT 
GTAGCTCTCC 
ATTTTTGCTG 
CGAGTCAATT 
ATAAAAACAG 



51 
i 

TCCGCTGCGC 60 

TCCCCGCTTC 120 

TCCATGCTGC 180 

AGAGGAGGCT 240 

GGTTTCCAGC 3 00 

CATGACAGAG 3 60 

TGGTGAACAC 42 0 

GAGGAGAGAT 4 80 

CCCCATGGCG 54 0 

ATCTTTAAAA 600 

GGATAATGAG 660 

ATGTGAAAGA 72 0 

TCAGGCTAGT 780 

AGTAAAGGAA 840 

AACTGGTTTG 90 0 

AAGACGATCT 960 

ATGCTTACCC 102 0 

TTACTTGAGA 10 80 

AGACAACAGT 1140 

ACAGAACAGT 1200 

TGGAAAATTT 1260 

ACTTTTGGGA 132 0 

CAAGCAC AAA 1380 

AGCAAAAGAT 1440 

GACAAAAGAA 1500 

TGGAGAAGCA 1560 

CTGTATGAGT 1620 

AGATATTGCA 1680 

TTCGAGTCCA 1740 

TAAGGAGTTG 180 0 

CCAGAGTACT 1860 

TTTCGATGCC 1920 

AGCAGAGGGG 1980 

TTTGATTTTT 2040 

TCAACTATTC 210 0 

TTTTATAGAT 2160 

GAACCAAGTT 222 0 

ATATTTTTGC 22 80 

TTATTTTTGA 2340 

GTCTAAGATT 240 0 

AATTTCCTTA 2460 

TTAAAGGGAC 2 52 0 

GACTTAGGCA 2580 

TAAGTGAGAT 2 64 0 

AGAAAAGGAA 2700 

TCTTAATAGG 2760 

GGGCAGATCA 282 0 

TTCTACTAAA 2 8 80 

CCCACGATAA 2 940 

TGTAATCCCA 3000 

GTTGCAGTGA 3060 

TCTCAAAAAA 312 0 

ATTAGGTTTT 3180 

GGCCCGGGCA 3240 

TTCATAGAGT 33 0 0 

ACATTGGTCT 33 60 

AAGTAATTAG 3420 

TACATGTTTA 3 480 

TTTAAAATTT 3540 

AAGAATTAAG 3 60 0 

ACTTTCTGCT 3660 

TGCCTCGCAA 3 72 0 

GTGGGCTTCA 3780 

TCAGAGCCCC 3 840 

AGGTGATAGA 3 90 0 

CCAAAGCAAA 3960 

GGCACACTGT 402 0 

GGT CCGACAC 4080 

AGATGGGGAG 4140 

AAGATCCCCT 4200 

GGGACTGAAC 42 60 

CAGGGTAGGC 432 0 

GATGCCAGGA 43 80 

CAGTTTTTTC 4440 

CCAGTTGAAT 450 0 

AGATCCTTTT 45 60 

TAAGGTTTGT 462 0 

TTAGAAGTGA 4680 

TTTTGAATTT 4740 

TACTCTAGAG 4800 
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CAGCGCTGTC CAATAGAAAT 
ACATTAAAGA AGTAAAAAGA 
C AAAAT AT C A TTTGAACATG 
TTGGTAATAC TAGTCTTCAA 
GT AC TAG C C A CATTGCAAGT 
AGCACAGTTC TAGGTTCCAC 
AG CTGG AAGT AAACATAGAG 
GTTTAAATGG CTTGCATGAG 
CCAGGCACTC TTCCCACTCC 
TGTAGAGTAG GCCGGGCGCA 
GTGGGCGGAT CACGAGGTCA 
CTCTACTGAA AATACAAAGC 
CTGCTCTGGA GGCTGAGGCA 
AGATCGCGCC ACTGCACCCC 
AAAAAAAAAA AAGAAAAGAA 
GAAGTAGACC AAAGTTTATA 
AATTATTTAT TGATCCTTGA 
AATTTAACCT TTTGAAAATA 
CTTGGAATCA AGTGAAATGA 
CAAAGACAAA CAGGAAAGTA 
AAGT GTT TAT TTACAGTGTC 
GATCTCCGTA AAATCTGGGG 
TGT TTAGTAG TGTCCAGTTT 
CATCACTGAG CCCTGGAATT 
GGCCGACATC TATGATTAGC 
CCACTTTTCT GTTTTTGTAA 
GCCTATGAGA GGCATTTATG 
TGTTTTATGA GAAATGCTTT 
GGCTTAGAGA GCTTTCCAGG 
CAGCACGGAA CATGCTTTCT 
TATTCTTGAG TTTAGATTTG 
CTCGTCTGTA TATTGGTATT 
ATTTTATAAT TACTCATTTG 
GCTCCCTTAA AA 



PCT/US02/12476 



ATAATCTGAG 
TACAAGTAGA 
TAATTAATAT 
AAT CTGGTAT 
GCTCAGTAGC 
CCTAACACGC 
ATCAAACCTC 
GTCATACAGC 
ACTACATTAC 
GTGGCT CATG 
GGAGATCGAG 
AAAATTAGCC 
GAATGGCGTG 
AGCCTGGGCG 
AAGAAAAGTC 
CCATAAGGAT 
ATCTGTAAGA 
ATAAACTTTA 
GTTATATGGT 
CAGAATAGAG 
ACGACAGAAA 
CACAGGTACA 
CAGATCATGC 
GGAGACTCAT 
TAGAAGCCAT 
TGCTTTCATT 
ATTTTTGTGC 
CCAAGGGAGG 
TGTAGTGCCA 
GAACTCACTT 
TCTTTTATAC 
TTTAAATTTT 
TAGTTTTTTT 



CCACATGTAT 
ACTAATTTTA 
AAAATTATTA 
GTAT CTTACA 
CACATGTGGC 
AAGTCCTGTG 
CTTTTAAAAA 
TAAATTCAGC 
TGTAGTGGTA 
CCTGTAATCC 
ACCATCCTGG 
AGGTGTGGTG 
AACCCAGGAG 
ACAGAGCGAG 
TAGAGAACAT 
ATTTTTCCTT 
TCAAATAACA 
AAAT AT CAGA 
CAT CACTAAA 
ACTTTTAGTA 
AGGATGTCTT 
AGAAATAGCC 
TGCCAAGAGG 
ACTTGCCCAG 
AAAGAAAAGC 
AGCAGAT CTT 
CTACAATAAG 
TCTAGGAAGA 
ATAAAAACTG 
GAGAGTGTAT 
AATTTTTAGC 
TGTGGTAAAT 
•TTTTAATTTA 



AATTTTATTT 
ATGTTTTAAT 
ATGTGATATT 
TTGATAGCAC 
TAGTGGCTAC 
GATT AG AAT C 
TGAGGACGCT 
CTCAACAGGG 
ATTCTTAGGG 
CAGCACTTTG 
CCAACATGGT 
GCGGGCGCCT 
GCAGAGATGG 
ACTCCATCTC 
TATATTAAGT 
AAATACCATG 
AGTCTCTATC 
TGTGTTATTA 
TTTAGAAATC 
AATAAATGGA 
TGTTGTCATA 
AATATTTAGT 
TATCTCCCCC 
CACAATGTTA 
TGCTAAGTGG 
TTTTTTCCAA 
TCAGCCTGTC 
TCCTGACACA 
ACCTGGAAAG 
GGTGTATGTC 
TCTTTTCCAG 
AATGAAAAGA 
ATAAACTTCC 



TCTTCTAGCC 4860 

TCAGTATATC 492 0 

TTACATTCTT 4980 

ATCTCACTTT 5040 

TGCACTGGAC 5100 

CCAGAATCAG 5160 

GAGGCACAGA 522 0 

TCTTCTGATT 52 80 

TTAAAAAAAG 5340 

GGAGGCCGAA 5400 

GAAACCCCGT 5460 

GTGGTCCCAG 5520 

CAGTGAGCCA 5580 

AAAAAAAAAA 5640 

GGTTATTATT 5700 

TTTGAAGAAC 5760 

CATGTTACCA 582 0 

CAGGATGATA 5 8 8 0 

TATTGTGAAA 5 940 

ATTTAAAAGA 60 0 0 

GTCTTTGAGG 60 60 

TCCCAGACCA 612 0 

TCAGGTGGGT 6180 

CGGGCAGACA 6240 

CCACTAGGTG 63 0 0 

GCTCCATGGG 63 60 

TGGTGTGAGT 642 0 

TAAGAACTTT 6480 

AAAACCTGCC 6540 

ACTTCTCATA 6600 

TTCACTTGTG 6660 

GTGAAATTAT 672 0 

TCCAAAAAGT 67 80 
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Seq ID NO: 166 Protein sequence : 
Protein Accession #: AAG34652 



I 

MAAEEEAAAG 
QVEDGEHQVK 
QHLRSLKGLT 
LNYDQASLTG 
YSGSRRSFFC 
NSKKDNSNFT 
LPQELLGTSC 
TNPWTKELEY 
SIGTDIANEI 
TRQNQSTVAV 
TL 



11 
I 

GKVLREENQC 
MKAFREAHSQ 
NSYVGSNYRP 
QSLFDFLHPK 
RIKSCKISVK 
CLVAIGRLQP 
YEYFHQDDHN 
IVSVNTLVLG 
LDLQRLQSSS 
HSHEPLLSDG 



21 



31 



41 



IAPWSSRVS 
TEKRRRDKMN 
SFLQDNELRH 
DVAKVKEQLS 
EEHGCLPNSK 
YIVPQNSGEI 
NLTDKHKAVL 
HSEPGEASFL 
YLDDSSPTGL 
AQLDFDAL CD 



PGTRPTAMGS 
NL I EEL SAM I 
LILKTAEGFL 
SFDISPREKL 
KKEHRKFYTI 
NVKPTEFITR 
QSKEKILTDS 
PCSSQSSEES 
MKDTHTWCR 
NDDTAMAAFM 



FSSHMTEFPR 
PQCNPMARKL 
FWGCERGKI 
IDAKTGLQVH 
HCTGYLRSWP 
FAVNGKFVYV 
YKFRAKDGSF 
SRQSCMSVPG 
SMSNKELFPP 
NYLEAEGGLG 



51 



KRKGSDSDPS 60 

DKLTVLRMAV 12 0 

LFVSKSVSKI 180 

SNLHAGRTRV 240 

PNIVGMEEER 3 00 

DQRATAI LGY 3 60 

VTLKSQWFSF 42 0 

MSTGTVLGAG 480 

SPSEMGELEA 540 

DPGDFSDIQW 60 0 



55 



Seq ID NO: 167 DNA sequence 
Nucleic Acid Accession #: NM_014400 
Coding sequence: 86-1126 



60 



65 



70 



75 



80 



85 



GGTTACTCAT 
GACGCCAAGG 
GATCTGGACT 
GTGCTACAGC 
GAAGTGCGCG 
CGGACAATTC 
CGGCCTGGAT 
CTGCAACGCC 
ATACCCGCCC 
GGGTACATCG 
CTTCGACGGC 
CTGTGTCCAG 
TGGCTCCTGT 
CCCTCGAATC 
CACATCTGTC 
GCCAGCGCCA 
GGAGCCCAGG 
TCCTGCAAAA 
ATTGGCAGCC 
AAATTTCCCT 
CCCACCACTG 
CTTCTGCTGC 
GGGTGTTCTA 
TCCTCTTGTG 
AGGATGCTAA 
GGTGGGACAA 
ATCGGTTCCC 
CTTATGTCTG 



11 

I 

CCTGGGCTCA 
GAGCAGGACG 
GCAGGCTGGC 
TGCGTGCAGA 
CCGGGCGTGG 
TCGCTGGCAG 
CTTCACGGGC 
AAGCTCAACC 
AACGGCGTGG 
CCGCCGGTCG 
AACGT CACCT 
GATGAATTCT 
TGCCAGGGGT 
CCACCCCTTG 
ACCACTTCTA 
ACCAGTCAGA 
TTGACTGGAG 
GGGGGGCCCC 
CTTCTGTTGG 
CTCACCTACT 
GACTGGGCTG 
GCTGGTTTGC 
GCTTTTTGAG 
ATGTTAGGAC 
GCTTCCTACT 
TGGCTCCCCA 
CATATGTCTT 
TGTGTGATCA 



21 



GGTAAGAGGG 
GAGCCATGGA 
TGCTGCTGCT 
AAGCAGATGA 
ACGT CTGCAC 
TGCSGGGTTG 
TTCTGGCGTT 
TCACCTCGCG 
AGTGCTACAG 
TGAG CTGCTA 
TGACGGCAGC 
GCACTCGGGA 
CCCGCTGTAA 
TCCGGCTGCC 
CCTCGGCCCC 
CTCCGAGACA 
GCGCCGCTGG 
AGCAGCCCCA 
CCGTGGCTGC 
TCTCTGGCCC 
GCCCAGCCCC 
GGCTTTGGGA 
GACAGCTCCT 
AGAGTGAGAG 
CACTTTCTCC 
CTCTAAGCAC 
CCTTACTAGA 
GTTTCTGGCA 



31 
I 

CCCGAGCTCG 
CCCCGCCAGG 
GCTGCTTCGC 
CGGATGCTCC 
CGAGGCCGTG 
CGGTTCGGGA 
CATCCAGCTG 
GGCGCTCGAC 
CTGTGTGGGC 
CAACGCCAGC 
TAATGTGACT 
TGGAGTAACA 
CTCTGACCTC 
CCCTCCAGAG 
AGTGAGACCC 
GGGAGTAGAA 
CCACCAGGAC 
TAATAAAGGC 
TGGTGTCCTA 
TGGGTACCCC 
TGTTTTTCCA 
AATAAAATAC 
GTATCCTTCT 
AAGTCAGCTG 
TAGCCAG CCT 
TGCCTCCCCT 
CTGTGAGCTC 
CATAAATGCC 



41 

I 

GAGGCGG C AC 
AAAGCAGGTG 
GGAGGAGCGC 
CCGAACAAGA 
GGGGCGGTGG 
CTCCCCGGCA 
CAGCAATGCG 
CCGGCAGGTA 
CTGAGCCGGG 
GATCATGTCT 
GTGTCCTTGC 
GGCCCAGGGT 
CGCAACAAGA 
CCCACGACTG 
ACATCCACCA 
CACGAGG CCT 
CGCAGCAATT 
TGTGTGGCTC 
CTGTGAGCTT 
TCTTCTCATC 
ACATTCCCCA 
CGTTGTATAT 
CATCCTTGTC 
TCACGGGGAA 
GGACTTTGGA 
ACTCCCCGCA 
CTCGAGGGCA 
TCAATAAAGA 



51 

I 

ACCCAGGGGG 60 

CCCAGGCCAT 12 0 

AGGCCCTGGA 180 

TGAAGACAGT 240 

AGACCATCCA 3 0 0 

AGAATGACCG 3 6 0 

CTCAGGATCG 420 

ATGAGAGTGC 480 

AGGCGTGCCA 540 

ACAAGGG CTG 60 0 

CTGTCCGGGG 660 

TCACGCTCAG 72 0 

CCTACTTCTC 780 

TGGCCTCAAC 84 0 

CCAAACCCAT 900 

CCCGGGATGA 960 

CAGGGCAGTA 1020 

CCACAGCTGG 1080 

CTCCACCTGG 1140 

ACTTCCTGTT 1200 

GTATCCCCAG 12 60 

ATTCTGGCAG 132 0 

TCTCCGCTTG 13 80 

GGTGAGAGAG 1440 

GCGTGGGGTG 1500 

TCTTTGGGGA 1560 

GGGACCGTGC 162 0 

TTTAATTACT 1680 



250 



WO 02/086443 

TTGTATAGTG AAAAAAAA 

Seq ID NO: 168 Protein sequence: 
Protein Accession #: NP_055215 

1 11 21 31 41 51 

l I I I l.l 

MDPARKAGAQ AMIWTAGWLL LLLLRGGAQA LECYSCVQKA DDGCSPNKMK TVKCAPGVDV 
CTEAVGAVET IHGQFSLAVX GCGSGDPGKN DRGLDLHGLL AFIQLQQCAQ DRCNAKLNLT 
SRALDPAGNE SAYPPNGVEC YSCVGIjSREA CQGTSPPWS CYNASDHVYK GCFDGNVTl>T 
AANVTVSLPV RGCVQDEFCT RDGVTGPGFT LSGSCCQGSR CNSDLRNKTY FSPRIPPLVR 
LPPPEPTTVA STTSVTTSTS APVRPTSTTK PMPAPTSQTP RQGVEHEASR DEEPRLTGGA 
AGHQDRSNSG QYPAKGGPQQ PHNKGCVAPT AGLAALLLAV AAGVLL 

Seq ID NO: 169 DNA sequence 
Nucleic Acid Accession #: NM_006875 
Coding sequence: 186-1190 

1 11 21 ■ 31 41 51 

I l I I I l 

GAATT CGGCA CGAGCGCGCG GCGAATCTCA ACGCTGCGCC GTCTGCGGGC GCTTCCGGGC 
CACCAGTTTC TCTGCTTTCC ACCCTGGCGC CCCCCAGCCC TGGCTCCCCA GCTGCGCTGC 
CCCGGGCGTC CACGCCCTGC GGGCTTAGCG GGTTCAGTGG GCTCAATCTG CGCAGCGCCA 
CCTCCATGTT GACCAAGCGT CTACAGGGGC CTCCCGCGCC CCCCGGGACC CCCACGCCGC 
CGCCAGGAGG CAAGGATCGG GAAGCGTTCG AGGCCGAGTA TCGACTCGGC CCCCTCCTGG 
GTAAGGGGGG CTTTGGCACC GTCTTCGCAG GACACCGCCT CAC AG AT CG A CTCCAGGTGG 
CCATCAAAGT GATTCCCCGG AATCGTGTGC TGGGCTGGTC CCCCTTGTCA GACTCAGTCA 
CATGCCCACT CGAAGTCGCA CTGCTATGGA AAGTGGGTGC AGGTGGTGGG CACCCTGGCG 
TGATCCGCCT GCTTGACTGG TTTGAGACAC AGGAAGGCTT CATGCTGGTC CTCGAGCGGC 
CTTTGCCCGC CCAGGATCTC TTTGACTATA TCACAGAGAA GGGCCCACTG GGTGAAGGCC 
CAAGCCGCTG CTTCTTTGGC CAAGTAGTGG CAGCCATCCA GCACTGCCAT TCCCGTGGAG 
TTGTCCATCG TGACATCAAG GATGAGAACA TCCTGATAGA CCTACGCCGT GGCTGTGCCA 
AACTCATTGA TTTTGGTTCT GGTGCCCTGC TTCATGATGA ACCCTACACT GACTTTGATG 
GGACAAGGGT GTACAGCCCC CCAGAGTGGA TCTCTCGACA CCAGTACCAT GCACTCCCGG 
CCACTGTCTG GTCACTGGGC ATCCTCCTCT ATGACATGGT GTGTGGGGAC ATTCCCTTTG 
AGAGGGACCA GGAGATTCTG GAAGCTGAGC TCCACTTCCC AGCCCATGTC TCCCCAGACT 
GCTGTGCCCT AATCCGCCGG TGCCTGGCCC CCAAACCTTC TTCCCGACCC T C ACT GG AAG 
AGATCCTGCT GGACCCCTGG ATGCAAACAC CAGCCGAGGA TGTTACCCCT CAACCCCTCC 
AAAGGAGGCC CTGCCCCTTT GGCCTGGTCC TTGCTACCCT AAGCCTGGCC TGGCCTGGCC 
TGGCCCCCAA TGGTCAGAAG AGCCATCCCA TGGCCATGTC ACAGGGATAG ATGGACATTT 
GTTGACTTGG TTTTACAGGT CATTACCAGT CATTAAAGTC CAGTATTACT AAGGTAAGGG 
ATTGAGGATC AGGGGTTAGA AGACATAAAC CAAGTTTGCC CAGTTCCCTT CCCAATCCTA 
CAAAGGAGCC TTCCTCCCAG AACCTGTGGT CCCTGATTTT GGAGGGGGAA CTTCTTGCTT 
CTCATTTTGC TAAGGAAGTT TATTTTGGTG AAGTTGTTCC CATTTTGAGC CCCGGGACTC 
TTATTTTGAT G ATGTGT CAC CCCACATTGG CACCTCCTAC TACCACCACA CAAACTTAGT 
TCATATGCTT TTACTTGGGC AAGGGTGCTT TCCTTCCAAT ACCCCAGTAG CTTTTATTTT 
AGTAAAGGGA CCCTTTCCCC TAGCCTAGGG TCCCATATTG GGTCAAGCTG CTTACCTGCC 
TCAGCCCAGG ATTTTTTATT TTGGGGGAGG TAATGCCCTG TTGTTACCCC AAGGCTTCTT 
TTTTTTTTTT TTTTTTTTTG GGTGAGGGGA CCCTACTTTG TTATCCCAAG TGCTCTTATT 
CTGGTGAGAA GAACCTTAAT TCCATAATTT GGGAAGGAAT GGAAGATGGA CACCACCGGA 
CACCACCAGA CAATAGGATG GGATGGATGG TTTTTTGGGG GATGGGCTAG GG GAAATAAG 
GCTTGCTGTT TGTTTTCCTG GGGCGCTCCC TCCAATTTTG CAGATTTTTG CAACCTCCTC 
CTGAGCCGGG ATTGTCCAAT TACTAAAATG TAAATAATCA CGTATTGTGG GGAGGGGAGT 
TCCAAGTGTG CCCTCCTTTT TTTTCCTGCC TGGATTATTT AAAAAGCCAT GTGTGGAAAC 
CCACTATTTA ATAAAAGTAA TAGAATCAGA AAAAAAAAAA AAAAAAAA 



Seq ID NO: 170 Protein sequence: 
Protein Accession #: NP_006866 

1 11 21 31 41 51 

I I I I i I 

MLTKPLQGPP APPGTPTPPP GGKDREAFEA EYRLGPLLGK GGFGTVFAGH RLTDRLQVAI 

KV I PRNRVLG WSPLSDSVTC PLEVALLWKV GAGGGHPGVI RLLDWFETQE GFMLVLERPL 

PAQDLFDYIT EKGPLGEGPS RCFFGQWAA IQHCHSRGW HRDIKDENIL IDLRRGCAKL 

IDFGSGALLH DEPYTDFDGT RVYSPPEWIS RHQYHALPAT VWSLGILLYD MVCGDIPFER 

DQEILEAELH FPAHVSPDCC AuIRRCtiAPK PSSRPSLEEI LLDPWMQTPA EDVTPQPLQR 

RPCPFGLVLA TLSLAWPGLA PNGQKSHPMA MSQG 

Seq ID NO: 171 DNA sequence 
Nucleic Acid Accession #: NM_003646 
Coding sequence: 89.. 2875 

1 11 21 31 41 51 

I I I I I I 

GCGGCGCGGA GCGGGCGTGC TGAGCCCCGG CCGCCGGCCC GGCATGGGCG TCTCCCGCGG 
GCCCTCCGCC GGCCGGGGCT AGGGCCGGAT GGAGCCGCGG GACGGTAGCC CCGAGGCCCG 
GAGCAGCGAC TCCGAGT CGG CTTCCGCCTC GTCCAGCGGC TCCGAGCGCG ACGCCGGTCC 
CGAGCCGGAC AAGGCGCCGC GGCGACTCAA CAAGCGGCGC TTCCCGGGGC TGCGGCTCTT 
CGGGCACAGG AAAGCCATCA CCAAGT CGGG CCTCCAGCAC CTGGCCCCCC CTCCGCCCAC 
CCCTGGGGCC CCGTGCAG CG AGTCAGAGCG GCAGAT CCGG AGTACAGTGG ACTGGAGCGA 
GTCAG CGACA TATGGGGAGC ACATCTGGTT CGAGACCAAC GTGTCCGGGG ACTTCTGCTA 
CGTTGGGGAG CAGTACTGTG TAGCCAGGAT GCTGAAGTCA GTGTCTCGAA GAAAGTGCGC 
AGCCTGCAAG ATTGTGGTGC ACACGCCCTG CATCGAGCAG CTGGAGAAGA TAAATTTCCG 
CTGTAAGCCG TCCTTCCGTG AATCAGGCTC CAGGAATGTC CGCGAGCCAA CCTTTGTACG 
GCACCACTGG GTACACAGAC GACGCCAGGA CGG CAAGTGT CGGCACTGTG GGAAGGGATT 
CCAGCAGAAG TTCACCTTCC ACAGCAAGGA GATTGTGGCC ATCAGCTGCT CGTGGTGCAA 
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GCAGGCATAC CACAGCAAGG 
GCTGGGGGTC CACGCAGCCG 
CCAGAATACT CTGAAAGCAA 
CAAGAAAGGG CCTGAGGAGG 
GCTCATGAAG CCCCTGCTGG 
GAT CATCCAG TCTTTCCTCT 
AGGGCCCAAG GAGGCGCTGG 
CGGGGG CG AC GGCACGGTGG 
GCCACCCCCT GTTGCC AT CC 
CTGGGGTGGG GGCTACACAG 
GAACGTGGTA CAGCTGGACC 
TGAGGACCGA GATGAAGGCG 
CAGCCTGGGC TTTGACGCCC 
AGAGAAATTC AACAGCCGCT 
CTTCCTGATG GGCAGCTCCA 
GGACTTGACT CCCAAGATCC 
CAGGTACTGT GCGGGCACCA 
CCAGCGGCAT GACGACGGCT 
GCTGCAGGTG GGCGGACACG 
ATCCAAGGCC ATCCCGGTGC 
CCGCATCGCC CTGCGCAACC 
CCCCCTGCAC AGCGACCAGC 
CAGCATGCAC GACTATGAGG 
GCCGCTGGGC ACTGTGGTGG 
TGAGAGACTC CAGCAGGAGC 
GTCCCCCAAG TGGTGCTTCC 
AG CC CAGGAG CACCTCAACT 
CCCTGAGCTG CTGGGGGCAT 
CACCTCACCC TGCTCACCCA 
TGAAGAGCTG ATTGAGGCTG 
AGCTGGGGGC GACCTCATGC 
CAGCACTGGC AGCAAGGATG 
TGATGCGGTG GAGGAAAACG 
CACCATCTGC CACTACATCG 
CGACACTCCC CGGCAGCGGG 
GAACCGGCAG CACTACCAGA 



PCT/US02/12476 



TGTCCTGCTT 
TGGTCATCCC 
GCAAGAAGAA 
GCCGCTGGAG 
TGTT TGTGAA 
GGTATCTCAA 
AGATGTACCG 
GCTGGATCCT 
TGCCCCTGGG 
ATGAGCCTGT 
GCTGGGACCT 
CCACCGACCG 
ACGTCACCCT 
TTCGGAATAA 
AGGACCTGGC 
AGGACCTGAA 
TGCCCTGGGG 
ACCTCGAGGT 
GCGAGCGGCT 
AGGTGGATGG 
AGGCCACCAT 
AGCCGGTGCC 
CCCTGCACTA 
TCCCAGGAGA 
CCGATGGTGC 
TGGACGCCAC 
ATGTGACTGA 
CGGCCCGGCC 
CGCCCCGGTC 
CCAAGAGGAA 
ACCGAGACGA 
TGGTCCGCTA 
GGGAGACCTG 
TGGAGGCCGG 
CTGAGAAGGC 
TGATCCAGCG 



CATGCTGCAG 
GCCCACCTGG 
GAAGAGGGCA 
ACCCTTCATC 
CCCCAAGAGT 
TCCCCGACAA 
CAAAGTGCAC 
CTCCACCCTG 
TACTGGCAAC 
GTCCAAGATC 
CCACGCTGAG 
GTTGCCCCTG 
GGAGTTCCAC 
GATGTTCTAC 
CAAGCACATC 
ACCCCAGTGT 
CCACCCTGGG 
CATTGGCTTC 
GACGCAGTGT 
CGAGCCCTGC 
GGTGCAGAAG 
AGAGCAGTTG 
CGACAAGGAG 
CAGTGACCTA 
TGGAGCCAAG 
CACTGCCAGC 
GAT CGCACAG 
TGACCTCCCA 
ACTGCAAGGG 
CGACTTCTGT 
GCAGAGTCGC 
CCTGCTGGAC 
TTTGCACCAA 
GGCCTCGCTC 
TCAGGACACC 
GGAGGACCAG 



CAGATCGAGG 
ATCCTCCGCG 
TCCTTCAAGA 
ATCAGGCCCA 
GGGGGCAACC 
GTCTTCGACC 
AACCTGCGGA 
GACCAGCTAC 
GACTTGGCCC 
CTCTCCCACG 
CCCAACCCCG 
GATGTCTTCA 
GAGTCTCGAG 
GCCGGGACAG 
CGAGTGGTGT 
GTTGTTTTCC 
GAGCACCACG 
ACCATGACGT 
CGCGAGGTGG 
AAGCTTGCAG 
GCCAAGCGGC 
CGCATCCAGG 
CAGCTCAAGG 
GAGCTCTGCC 
TCCCCGACAT 
CGCTTCTACA 
GATGAGATTT 
ACCCCCACTT 
GATGCTGCAC 
AAGCTCCAGG 
ACGCTCCTGC 
CACGCCCCCC 
GCAGCGGCCC 
ATGAAGACAG 
GAGCTGGCCG 
GAGACGGCTG 



AGCCGTGCTC 78 0 

CCCGGAGGCC 840 

GGAAGTCCAG 900 

CCCCCTCCCC 960 

AGGGTGCAAA 102 0 

TGAGCCAGGG 1080 

TCCTGGCGTG 1140 

GCCTGAAGCC 12 00 

GAACCCTCAA 1260 

TGGAGGAGGG 132 0 

AGGCAGGGCC 13 80 

ACAACTACTT 144 0 

AGGCCAACCC 1500 

CTTTCTCTGA 1560 

GTGATGGAAT 162 0 

TGAACATCCC 1680 

ACTTTGAGCC 1740 

CGTTGGCCGC 180 0 

TGCTCACCAC 1860 

CCTCACGCAT 1920 

GGAGCGCCGC 1980 

TGAGTCGCGT 2 040 

AGGCCTCTGT 210 0 

GTGCCCACAT 2160 

GCCAGAAACT 222 0 

GGATCGACCG 22 8 0 

ATATCCTGGA 2340 

CCCCTCTCCC 2400 

CCCCTCAAGG 2460 

AGCTGCACCG 2 52 0 

ACCACGCAGT 2580 

CAGAGATCCT 2 640 

TGGGCCAGCG 2 70 0 

ACCAGCAGGG 2760 

CCTACCTGGA 2820 

TGTAGCGGGC 2880 



40 



Seq ID NO: 172 Protein sequence: 
Protein Accession #: NP 003637 



45 



50 



55 



60 



MEPRDGSPEA 
GLQHLAPPPP 
MLKSVSRRKC 
DGKCRHCGKG 
PPTVJ I LRARR 
NPKSGGNQGA 
LSTLDQLRIiK 
LHAEPNPEAG 
KMFYAGTAFS 
GHPGEHHDFE 
GEPCKLAASR 
YDKEQLKEAS 
TTASRFYRID 
SLQGDAAPPQ 
YLLDHAPPEI 
AQDTELAAYL 



11 
1 

RSSDSESASA 
TPGAPCSESE 
AACKIWHTP 
FQQKFTFHSK 
PQNTLKASKK 
KIIQSFLWYL 
PPPPVAILPL 
PEDRDEGATD 
DFLMGSSKDL 
PQRHDDGYLE 
IRIALRNQAT 
VPLGTWVPG 
RAQEHLNYVT 
GEELt I E AAKR 
LDAVEENGET 
ENRQHYQMIQ 



21 

i 

SSSGSERDAG 
RQIRSTVDWS 
CIEQLEKINF 
EIVAISCSWC 
KKRASFKRKS 
NPRQVFDLSQ 
GTGNDLARTL 
RLPLDVFNNY 
AKHIRWCDG 
VIGFTMTSLA 
MVQKAKRRSA 
DSDLELCRAH 
EIAQDEIYIL 
NDFCKLQELH 
CLHQAAALGQ 
REDQETAV 



31 
1 

PEPDKAPRRL 
ESATYGEHIW 
RCKPSFRESG 
KQAYHSKVSC 
SKKGPEEGRW 
GGPKEALEMY 
NWGGGYTDEP 
FSLGFDAHVT 
MDLTPKIQDL 
ALQVGGHGER 
APLHSDQQPV 
IERLQQEPDG 
DPELLGASAR 
RAGGDLMHRD 
RTICHYIVEA 



41 

I 

NKRRFPGLRL 
FETNVSGDFC 
SRNVREPTFV 
FMLQQIEEPC 
RPFIIRPTPS 
RKVHNLRILA 
VSKILSHVEE 
LEFHESREAN 
KPQCWFLNI 
LTQCREWLT 
PEQLRIQVSR 
AGAKSPTCQK 
PDLPTPTSPL 
EQSRTLLHHA 
GASLMKTDQQ 



51 
1 

FGHRKAI TKS 60 

YVGEQYCVAR 12 0 

RHHWVHRRRQ 180 

SLGVHAAW I 240 

PLMKPLLVFV 300 

CGGDGTVGWI 3 60 

GNWQLDRWD 420 

PEKFNSRFRN 480 

PRYCAGTMPW 540 

TSKAIPVQVD 600 

VSMHDYEALH 660 

L.SPKWCFIiDA 720 

PTSPCSPTPR 780 

VSTGSKDWR 84 0 

GDTPRQRAEK 900 



Seq ID NO: 173 DNA sequence 
Nucleic Acid Accession #: AF232772 
Coding sequence: 1-1662 



65 



70 



75 



80 



85 



ATGCCGGTGC 
GTGCTGGGTG 
CACTACCTGT 
CTTTTTGCCT 
TCCCCGCGGC 
TTGCGCAAGT 
GTGGTGGATG 
GGCGGCACCG 
GGTGAGACGG 
AGCACCTTCT 
TTCAAGGCCC 
GATCCAGCCT 
GTCGGGGGAG 
GTGCGGTACT 
CAGTGTATTA 
GACTGGTACC 
ACCAACCGAG 
ACAGAGACCC 
TACTTCCGGG 
TACGAGTCAG 
TTCTACCGGG 
ATTATCAAGG 



11 
I 

AGCTGACGAC 
GCATCCTGGC 
CCTTCGGCCT 
TCCTGGAGCA 
GGGGCTCGGT 
GCCTGCGCTC 
GCAACCGCCA 
AGCAGGCCGG 
AGGCCAGCCT 
CGTGCAT CAT 
TCGGCGATTC 
GCACCATCGA 
ATGTCCAGAT 
GGATGGCCTT 
GTGGGCCCTT 
ATCAGAAGTT 
TCCTGAGCCT 
CCACTAAGTA 
AGTGGCTCTA 
TGGTCACGGG 
GCCGCATCTG 
CCACCTACGC 



21 



AGCCCTGCGT 
AGCCTATGTG 
GTACGGCGCC 
CCGGCGCATG 
GGCACTGTGC 
GGCCCAGCGC 
GGAGGACGCC 
CTTCTTTGTG 
GCAGGAGGGC 
GCAGAAGTGG 
GGTGGACTAC 
GATGCTTCGA 
CCTCAACAAG 
CAACGTGGAG 
GGGCATGTAC 
CCTAGGCAGC 
TGGCTACCGA 
CCTCCGGTGG 
CAACTCTCTG 
TTTCTTCCCC 
GAACATTCTC 
CTGCTTCCTT 



31 
I 

GTGGTGGGCA 
ACGGGCTACC 
ATCCTGGGCC 
CGACGTGCCG 
ATTGCCGCAT 
ATCTCCTTCC 
TACATGCTGG 
TGGCGCAGCA 
ATGGACCGTG 
GGAGGCAAGC 
AT CCAGGTGT 
GTCCTGGAGG 
TACGACTCAT 
CGGGCCTGCC 
CGCAACAGCC 
AAGTGCAGCT 
ACTAAGTATA 
CTCAACCAGC 
TGGTTCCATA 
TTCTTCCTCA 
CTCTTCCTGC 
CGGGGCAATG 



41 
I 

CCAGCCTGTT 
AGTT CATCCA 
TGCACCTGCT 
GCCAGGCCCT 
ACCAGGAGGA 
CTGACCTCAA 
ACATCTTCCA 
ACTTCCATGA 
TGCGGGATGT 
GCGAGGTCAT 
GCGACTCTGA 
AGGATCCCCA 
GGATTTCCTT 
AGTCCTACTT 
TCCTCCAGCA 
TCGGGGATGA 
CCGCGCGCTC 
AAACCCGCTG 
AGCACCACCT 
TTGCCACGGT 
TGACGGTGCA 
CAGAGATGAT 



51 
I 

TGCCCTGGCA 60 

CACGGAAAAG 120 

CATTCAGAGC 180 

GAAGCTGCCC 240 

CCCTGACTAC 3 00 

GGTGGTCATG 3 60 

CGAGGTGCTG 420 

GGCAGGCGAG 480 

GGTGCGGGCC 540 

GTACACGGCC 600 

CACTGTGCTG 660 

AGTAGGGGGA 720 

CCTGAGCAGC 780 

TGGCTGTGTG 840 

GTTCCTGGAG 900 

CCGGCACCTC 960 

CAAGTGCCTC 1020 

GAGCAAGTCT 10 80 

CTGGATGACC 1140 

TATACAGCTT 1200 

GCTGGTGGGC 1260 

CTTCATGTCC 132 0 



252 



WO 02/086443 

CTCTACTCCC TCCTCTATAT GTCCAGCCTT 
ATCAACAAAT CTGGCTGGGG CACCTCTGGC 
CTCATTCCTG TGTCCATCTG GGTGGCAGTT 
TGCCAGGACC TGTTCAGTGA GACAGAGCTA 
GGCTGCTACT GGGTGGCCCT CCTCATGCTA 
AAGAAGCCGG AGCAGTACAG CTTGGCTTTT 
CGGGTAAAGT GCAATGGGTA AGGGAGGGAA 
GGGAGGAGGG AGTGCTGTGT TTTAGTCTCT 
AAGAACGGTG ATGTAGTATG GCCTGACAGC 
AGATGCAGGG CTGCAGGGGA TTCTGTGTTT 
TAGGCAGTAG CCTCCTCCTG GGCTCCAGAG 
AGTCCCATTC AGTGGCAACT TGTGATAGGT 
TTCTCCCAGC CCATCTGAAC ACAACCAGAG 
GGCCGGTTAG TGTATGTCAC CCCCACCCCA 
GCGCGTGAGA TACAAGGCCC AGAAGCCTGA 
ATGGTGCTTT ATGTGAGATA CCCCACTCCA 
CAGGGAGTTA GCACTGAACT GCTTTTAAAA 
GGAACAAAGA GATTGTGGTG GTGCTAAAGG 
TTCCACCTGG AAACTGCTCA GACGTCTAGA 
GGGGAGATAA AAAGATTAAG CCCCAACATG 
TAACCTGTAT ACTCTTGAAT TCCTCTCAAA 
CCCCACTTCA CTTTCTTCAA AGCCACATTT 
CCCTCATCAT CATAGGTAAG GTTTTCAAGG 
TAGAAGCTTC AGCAGGAGGC AAGCGTGTTC 
TGATCAAATT GGCTACAATC TTGGAGCTGC 
ATGTGTGACT TTCAGGCTAC TGTTCTTGAC 
TCCCAAAGTG AACTCTCAAA TCCAAAATGG 
GGCTTCTCCA GGGAATTCTT ACAGCCAAGT 
TCCAGAAACC AAACTAGGAG ATGAAACTGG 
CTCATGCCTC CTGAGGCTGT TTTTGGCTGT 
GAAGCCATTT TCCAAGTGAC TTGCAATCCA 
TGGGATCCTG ACTAAGCCTT TGACTTAAGG 
TCAAAGGGGC CAACTAACCC GTGCAGAACC 
AAGCCTCTAA TGTACCAAGT GCTTCCTACA 
GGGCAAACCC TGGTGCTTTC CTTCATCTCC 
AACAGTTGCC ACATCACACA GACCTCCAGT 
CCAACCCATT GAAGGCTGGA AGGCAGCAGG 
GTTCTGCTGG CCAAGAAGTT AAACTATTTT 
CAAGTGCAGA GTTCAGACTT CGCTAAGGGC 
AATGTAGGAT GACAGGCTCT CCTGGCTGTC 
GTCAACTTTC CTCAAATCAA AAACAGGCAG 
TCGACTGGTT TTTCTAAGTT ATTTTGTACA 
CAGCTTTATC CCCGTTTCTT GCAAGGGAAG 
TTTCCTCATT GAGAATTCAA ATCCTCTTTT 
TTTATTTTTA CCTGCTTTTT TTTTTTTTTT 
CTTATTTGTC AAAATAAAGA TTCTCACAT 



CTGCCGGCCA AGATCTTTGC CATTGCTACC 
CGAAAAACCA TTGTGGTGAA CTTCATTGGC 
CTCCTGGAGG GGCTGGCCTA CACAGCTTAT 
GCCTTCCTTG .TCTCTGGGGC TATACTGTAT 
TATCTGGCCA TCATCGCCCG GCGATGTGGG 
GCTGAGGTGT GACATGGCCC CCAAGCAGAG 
GGGGAATGGA AGAGAAAAGA CAGGGTGGGA 
T AATGGT CCA AAGGACAAAT CTAAAATGCA 
TCTGTTTAGA GGAGGCAACA CTGATCCCCC 
TCAGACTGCC TGTCTGCTTG CATCTGCACA 
GGCACTCAGA AGTTGTGCTA AACCAAGTTA 
ACCTGAGTGA CGGCAACCTG CGGAAGGAGG 
GTGGCAGGAG AATTTCTACT GAGCGAGGTG 
CCCATAAGTA GTCAT CAATG CAATAAGATT 
TCTTTGGGCA TCAGAAAACA GGGT CCAGGA 
CATCAACATT CCAGGGATGA GCCAAACCAG 
GTGCACATTA AAAAGGAAAG TTTGCCAGGA 
AGGCCATAAG CTACACAGAG GCCTTGGGTG 
TGGGTTCTTA GCTTGTCTGT GATCTCTGCT 
TTCAGAAAAG AAGTGAAGTC TTGGGTATTT 
TTCAGCTCTG ATCTGAGGCT AAGACACACT 
TTTGAGGTAT CACTGCAGTC ACCTCTTCTA 
TGGCAATTGG GGCGGAGCCC CGGCTTCTTA 
TCAGCACATA TGGGAACTAT GAGGAGCCTC 
TTGGACGGAT TCCTTGGCAG CCGGGTTAGC 
AATCATCTCC AATGGAAAGC TTTTCAGTGT 
TTATCTTTGA GACCATCCAT TCTCCTCAGT 
TGTGACAGTC ACTGCATTTG CCTGCTTCTT 
TTCCTACATC CTAAGGTTCT TGCTTTCTCT 
TTTCCCTCTG CTGCTTTTGG GGAAT GAG GG 
GGCTGTTCTC AGCGTTTTGA GTTTAAAACC 
GTTGCTTGCT TGCCCTCCAA ATGTCCTTTC 
AGCACTAAGG TGGACAGCAG ACAAGAGGGC 
AAGACGCAAG GTGTGCTCCG AACCACAGAT 
CACGAACTCA AGGGTTTTCC AAGTGTAGCT 
TTCTGGTAAG ACTGCTGGTT G ACAT C AG AC 
CATTTGCTAA GGCAGCTGAT CCAGGCAATC 
GAGCATTAGA ATGGAGGAAA TCCGGTCAGC 
TTGTTTTTCT TCAGCATTTA CTTGAAGATT 
CTAC CAT C AG CTCTGCCTTG CACTGTGGTC 
GTACAGGTAG TGGGCTCACA ACGTTTGACC 
TTTTTCAGCA GCAAAACCAA ACTGGGTCTT 
AGCCTTTATA CAATTGGACG CATTTTGGTT 
GTATTGTTTC TACAATAAT T TGTAAACATA 
TAATTTTCAG GTCAAGTTTT TTATACTGCA 



Seq ID NO: 174 Protein sequence: 
Protein Accession #: AAF36984 



1 

I 

MPVQLTTALR 
LFAFLEHRRM 
WDGNRQEDA 
STFSCIMQKW 
VGGDVQ I LiNK 
DWYHQKFLGS 
YFREWLYNSL 
I IKATYACFL 
LIPVSIWVAV 
KKPEQYSLAF 



11 

I 

WGTSLFALA 
RRAGQALKLP 
YMLDIFHEVL 
GGKREVMYTA 
YDSWISFLSS 
KCSFGDDRHL 
WFHKHHIiWMT 
RGNAEMIFMS 
LLEGL.AYTAY 
AEV 



21 

1 

VLGGILAAYV 
SPRRGSVALC 
GGTEQAGFFV 
FKALGDSVDY 
VRYWMAFNVE 
TNRVLSLGYR 
YESWTGFFP 
LYSLLYMSSL 
CQDLFSETEL 



31 
I 

TGYQFIHTEK 
IAAYQEDPDY 
WRSNFHEAGE 
IQVCDSDTVL 
RACQSYFGCV 
TKYTARSKCL 
FFLIATVIQL 
LPAKIFAIAT 
AFLVSGAILY 



41 

I 

HYLSFGLYGA 
LRKCLRSAQR 
GETEASLQEG 
DPACTIEMLR 
QCISGPLGMY 
TETPTKYLRW 
FYRGRIWNIL 
INKSGWGTSG 
GCYWVALLML 



51 
I 

ILGLHLLIQS 
I SFPDLKWM 
MDRVRDWRA 
VLEEDPQVGG 
RNSDLQQFLE 
LNQQTRWSKS 
LFLLTVQLVG 
RKTIWNFIG 
YLAI I ARRCG 



Seq ID NO: 175 DNA sequence 
Nucleic Acid Accession #: NM_000691 
Coding sequence: 43.. 1404 



1 11 21 31 41 51 

1)1111 

CCAGGAGCCC CAGTTACCGG GAGAGGCTGT GTCAAAGGCG CCATGAGCAA GAT CAGCGAG 
GCCGTGAAGC GCGCCCGCGC CGCCTTCAGC TCGGGCAGGA CCCGTCCGCT GCAGTTCCGA 
TTCCAGCAGC TGGAGGCGCT GCAGCGCCTG ATCCAGGAGC AGG AG CAGG A GCTGGTGGGC 
GCGCTGGCCG CAGACCTGCA CAAGAATGAA TGGAACGCCT ACTATGAGGA GGTGGTGTAC 
GTCCTAGAGG AGATCGAGTA CATGATCCAG AAGCTCCCTG AGTGGGCCGC GGATGAGCCC 
GTGGAGAAGA CGCCCCAGAC TCAGCAGGAC GAGCTCTACA TCCACTCGGA GCCACTGGGC 
GTGGTCCTCG TCATTGGCAC CTGGAACTAC CCCTTCAACC TCACCATCCA GCCCATGGTG 
GGCGCCATCG CTGCAGGGAA CGCAGTGGTC CTCAAGCCCT CGGAGCTGAG TGAGAACATG 
GCGAGCCTGC TGGCTACCAT CATCCCCCAG TACCTGGACA AGGATCTGTA CCCAGTAATC 
AATGGGGGTG TCCCTGAGAC CACGGAGCTG CTCAAGGAGA GGTTCGACCA TATCCTGTAC 
ACGGGCAGCA CGGGGGTGGG G AAGAT CATC ATGACGGCTG CTGCCAAGCA CCTGACCCCT 
GTCACGCTGG AGCTGGGAGG GAAGAGTCCC TGCTACGTGG ACAAGAACTG TGACCTGGAC 
GTGGCCTGCC GACG CAT CG C CTGGGGGAAA TTCATGAACA GTGGCCAGAC CTGCGTGGCC 
CCAGACTACA TCCTCTGTGA CCCCTCGATC CAGAACCAAA TTGTGGAGAA GCTCAAGAAG 
TCACTGAAAG AGTTCTACGG GGAAGATGCT AAGAAATCCC GGGACTATGG AAGAATCATT 
AGTGCCCGGC ACTTCCAGAG GGTGATGGGC CTGATTGAGG GCCAGAAGGT GGCTTATGGG 
GGCACCGGGG ATGCCGCCAC TCGCTACATA GCCCCCACCA TCCTCACGGA CGTGGACCCC 



1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
378Q 
3840 
3900 
3960 
4020 



60 
120 
180 
240 
300 
360 
420 
480 
540 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 



253 



WO 02/086443 

CAGTCCCCGG TGATGCAAGA GGAGATCTTC GGGGCTGTGC TGCCCATCGT GTGCGTGCGC 1080

AGCCTGGAGG AGGCCATCCA GTTCATCAAC CAGCGTGAGA AGCCCCTGGC CCTCTACATG 1140

TTCTCCAGCA ACGACAAGGT GATTAAGAAG ATGATTGCAG AGACATCCAG TGGTGGGGTG 1200

GCGGCCAACG ATGTCATCGT CCACATCACC TTGCACTCTC TGCCCTTCGG GGGCGTGGGG 1260

AACAGCGGCA TGGGATCCTA CCATGGCAAG AAGAGCTTCG AGACTTTCTC TCACCGCCGC 1320

TCTTGCCTGG TGAGGCCTCT GATGAATGAT GAAGGCCTGA AGGTCAGATA CCCCCCGAGC 1380

CCGGCCAAGA TGACCCAGCA CTGAGGAGGG GTTGCTCCGC CTGGCCTGGC CATACTGTGT 1440

CCCATCGGAG TGCGGACCAC CCTCACTGGC TCTCCTGGCC CTGGAGAATC GCTCCTGCAG 1500

CCCCAGCCCA GCCCCACTCC TCTGCTGACC TGCTGACCTG TGCACACCCC ACTCCCACAT 1560

GGGCCCAGGC CTCACCATTC CAAGTCTCCA CCCCTTTCTA GACCAATAAA GAGACAAATA 1620
CAATTTTCTA ACTCGG

Seq ID NO: 176 Protein sequence: 
Protein Accession #: NP_000682 

1 11 21 31 41 51 

| | | | | |

MSKISEAVKR ARAAFSSGRT RPLQFRFQQL EALQRLIQEQ EQELVGALAA DLHKNEWNAY 60

YEEVVYVLEE IEYMIQKLPE WAADEPVEKT PQTQQDELYI HSEPLGVVLV IGTWNYPFNL 120

TIQPMVGAIA AGNAVVLKPS ELSENMASLL ATIIPQYLDK DLYPVINGGV PETTELLKER 180

FDHILYTGST GVGKIIMTAA AKHLTPVTLE LGGKSPCYVD KNCDLDVACR RIAWGKFMNS 240

GQTCVAPDYI LCDPSIQNQI VEKLKKSLKE FYGEDAKKSR DYGRIISARH FQRVMGLIEG 300

QKVAYGGTGD AATRYIAPTI LTDVDPQSPV MQEEIFGPVL PIVCVRSLEE AIQFINQREK 360

PLALYMFSSN DKVIKKMIAE TSSGGVAAND VIVHITLHSL PFGGVGNSGM GSYHGKKSFE 420
TFSHRRSCLV RPLMNDEGLK VRYPPSPAKM TQH

Seq ID NO: 177 DNA sequence 

Nucleic Acid Accession #: NM_001067.1 

Coding sequence: 108-4703 

1 11 21 31 41 51 

| | | | | |

CTAACCGACG CGCGTCTGTG GAGAAGCGGC TTGGTCGGGG GTGGTCTCGT GGGGTCCTGC 60 

CTGTTTAGTC GCTTTCAGGG TTCTTGAGCC CCTTCACGAC CGTCACCATG GAAGTGTCAC 120 

CATTGCAGCC TGTAAATGAA AATATGCAAG TCAACAAAAT AAAGAAAAAT GAAGATGCTA 180 

AGAAAAGACT GTCTGTTGAA AGAAT CTATC AAAAGAAAAC ACAATTGGAA CATATTTTGC 240 

TCCGCCCAGA CACCTACATT GGTTCTGTGG AATTAGTGAC CC AG CAAATG TGGGTTTACG 300 

ATGAAGATGT TGGCATTAAC TATAGGGAAG TCACTTTTGT TCCTGGTTTG TACAAAATCT 3 60 

TTGATGAGAT TCTAGTTAAT GCTGCGGACA ACAAACAAAG GGACCCAAAA ATGTCTTGTA 42 0 

TTAGAGTCAC AATTGATCCG GAAAACAATT TAATTAGTAT ATGGAATAAT GGAAAAGGTA 480 

TTCCTGTTGT TGAACACAAA GTTGAAAAGA TGTATGTCCC AGCTCTCATA TTTGGACAGC 540 

TCCTAACTTC TAGTAACTAT GATGATGATG AAAAGAAAGT GACAGGTGGT CGAAATGGCT 600 

ATGGAGCCAA ATTGTGTAAC ATATTCAGTA CCAAATTTAC TGTGGAAACA GCCAGTAGAG 660 

AATACAAGAA AATGTTCAAA CAGACATGGA TGGATAATAT GGGAAGAGCT GGTGAGATGG 72 0 

AACTCAAGCC CTTCAATGGA G AAG AT TATA CAT GT AT C AC CTTTCAGCCT GATTTGTCTA 780 

AGTTTAAAAT GCAAAGCCTG GACAAAGATA TTGTTGCACT AATGGTCAGA AGAGCATATG 840 

ATATTGCTGG ATCCACCAAA GATGTCAAAG TCTTTCTTAA TGGAAATAAA CTGCCAGTAA 90 0 

AAGGATTTCG TAGTTATGTG GACATGTATT TGAAGGACAA GTTGGATGAA ACTGGTAACT 960 

CCTTGAAAGT AATACATGAA CAAGTAAACC ACAGGTGGGA AGTGTGTTTA ACTATGAGTG 102 0 

AAAAAGGCTT TCAGCAAATT AGCTTTGTCA ACAGCATTGC TACAT CCAAG GGTGGCAGAC 10 80 

ATGTTGATTA TGTAGCTGAT CAGATTGTGA CTAAACTTGT TGATGTTGTG AAGAAGAAGA 1140 

ACAAGGGTGG TGTTGCAGTA AAAGCACATC AGGTGAAAAA TCACATGTGG ATTTTTGTAA 12 00 

ATGCCTTAAT TGAAAACCCA ACCTTTGACT CTCAGACAAA AGAAAACATG ACTTTACAAC 12 60 

CCAAGAGCTT TGGATCAACA TGCCAATTGA GTGAAAAATT TATCAAAGCT GCCATTGGCT 132 0 

GTGGTATTGT AGAAAGCATA CTAAACTGGG TGAAGTTTAA GGCCCAAGTC CAGTTAAACA 1380 

AGAAGTGTTC AGCTGTAAAA CATAATAGAA TCAAGGGAAT TCCCAAACTC GATGATGCCA 1440 

ATGATGCAGG GGGCCGAAAC TCCACTGAGT GTACGCTTAT CCTGACTGAG GGAGATT CAG 1500 

CCAAAACTTT GGCTGTTTCA GGCCTTGGTG TGGTTGGGAG AGACAAATAT GGGGTTTTCC 1560 

CTCTTAGAGG AAAAATACTC AATGTTCGAG AAGCTTCTCA TAAGCAGATC ATGGAAAATG 1620 

CTGAGATTAA C AAT AT CAT C AAGATTGTGG GTCTTCAGTA CAAGAAAAAC TATGAAGATG 1680 

AAGATTCATT GAAGACGCTT CGT T ATGGGA AGATAATGAT TATGACAGAT CAGGACCAAG 1740 

ATGGT TCCCA CATCAAAGGC TTGCTGATTA ATTTTATCCA TCACAACTGG CCCTCTCTTC 180 0 

TGCGACATCG TTTTCTGGAG GAATTTATCA CTCCCATTGT AAAGGTATCT AAAAACAAGC 18 60 

AAGAAATGGC ATTTTACAGC CTTCCTGAAT TTGAAGAGTG GAAGAGTTCT ACTCCAAATC 1920 

ATAAAAAATG GAAAGTCAAA TATTACAAAG GTTTGGGCAC CAGCACATCA AAGGAAGCTA 1980 

AAGAATACTT TGCAGATATG AAAAGACATC GTATCCAGTT CAAATATTCT GGTCCTGAAG 2040 

ATGATGCTGC TATCAGCCTG GCCTTTAGCA AAAAACAGAT AGATGATCGA AAGGAATGGT 2100 

TAACTAATTT CATGGAGGAT AGAAGACAAC GAAAGTTACT TGGGCTTCCT GAGGATTACT 2160 

TGTATGGACA AACTACCACA TATCTGACAT ATAATGACTT CAT CAAC AAG GAACTTATCT 2220 

TGTTCTCAAA TTCTGATAAC GAGAGATCTA TCCCTTCTAT GGTGGATGGT TTGAAACCAG 2280 

GTCAGAGAAA GGTTTTGTTT ACTTGCTTCA AACGGAATGA CAAGCGAGAA GTAAAGGTTG 2340 

CCCAATTAGC TGGATCAGTG GCTGAAATGT CTTCTTATCA TCATGGTGAG ATGTCACTAA 240 0 

TGATGACCAT TATCAATTTG GCTCAGAATT TTGTGGGTAG CAATAATCTA AACCTCTTGC 2460 

AGCCCATTGG TCAGTTTGGT ACCAGGCTAC ATGGTGGCAA GGATTCTGCT AGTCCACGAT 252 0 

ACATCTTTAC AATGCT CAGC TCTTTGGCTC GATTGTTATT TCCACCAAAA GATGATCACA 2580 

CGTTGAAGT T TTTATATGAT GACAACCAGC GTGTTGAGCC TGAATGGTAC ATTCCTATTA 2 640 

TTCCCATGGT GCTGATAAAT GGTGCTGAAG GAATCGGTAC TGGGTGGTCC TGCAAAATCC 2 70 0 

CCAACTTTGA TGTGCGTGAA ATTGTAAATA ACATCAGGCG TTTGATGGAT GGAGAAGAAC 2760 

CTTTGCCAAT GCTTCCAAGT TACAAGAACT TCAAGGGTAC TATTGAAGAA CTGGCTCCAA 2820 

AT CAAT ATGT GATTAGTGGT GAAGTAGCTA TTCTTAATTC TACAACCATT GAAATCTCAG 2880 

AGCTTCCCGT CAGAACATGG ACCCAGACAT ACAAAGAACA AGTTCTAGAA CCCATGTTGA 2 940 

ATGGCACCGA GAAGACACCT CCTCTCATAA CAGACTATAG GGAATACCAT ACAGATACCA 3000 

CTGTGAAATT TGTTGTGAAG ATGACTGAAG AAAAACTGGC AGAGGCAGAG AGAGTTGGAC 3060 

TACACAAAGT CTTCAAACTC CAAACTAGTC TCACATGCAA CTCTATGGTG CTTTTTGACC 3120 

ACGTAGGCTG TTTAAAGAAA TATGACACGG TGTTGGATAT TCTAAGAGAC TTTTTTGAAC 3180 

TCAGACTTAA ATATTATGGA TTAAGAAAAG AATGGCTCCT AGGAATGCTT GGTGCTGAAT 3240 

CTGCTAAACT G AAT AAT CAG GCTCGCTTTA T CTTAGAGAA AAT AG AT G G C AAAATAATCA 33 0 0 
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TTGAAAATAA GCCTAAGAAA 
ATCCTGTGAA GGCCTGGAAA 
AGAGTGACAA CGAAAAGGAA 
TCAACTATCT TCTTGATATG 
GCAGGCTAAG AAATGAAAAA 
ATTTGTGGAA AGAAGACTTG 
AAAAACAAGA TGAACAAGTC 
CACAAATGGC TGAAGTTTTG 
TAGAAATGAA AGCAGAGGCA 
AAGGAAGCCC TCAAGAAGAT 
AACAGAAAAG AGAACCAGGT 
TCAAAAAAGG AAAGAAGAGA 
AAAGTAATTT TGATGTCCCT 
AATTCACAAT GGATTTGGAT 
ATGAAGATTT TGTCCCATCA 
GTAACAAAGA ACTGAAACCA 
AGGGCAGTGT ACCACTGTCT 
TTACAAACCC AGTTCCTAAA 
CTTCCACCTC CACTACCGGT 
CAGCTTTGAA TTCTGGTGTC 
AAAGGAAGCC ATCCACTTCT 
CAGTCACAAG CAAGAAATCC 
CTGTGGCTCC TCGGGCAAAA 
CAGATGAAGA TGATCTGTTT 
GCCCAAGACT GGTTTTAAAG 
TGGGGAAGGT GTTTTTAGTA 
TTTTTATAAT ACTGTCTAAA 
TCTGTGTTTT GAGTCTGCTT 
TGTAGAAATA GCTATCTGAT 
AGCTAAAACT AGAGCAGTTT 
AGATATGAGA TAG AG CATAA 
GATAGAACTT TATGGTTCTA 
TTTTTCTTTA AG C AATGAGA 
AAAGAAAAAC ACTTTGGCTG 
GAGTAGTTAT GTGATTATTT 
ATCTCCCAAA GAGAGAAACC 
CATTTGATCC AAGATCTTAA 
TTCATTTTGG GAAATCTCCA 
GTTATATGTG TGTGACTTGA 
TCTATTAGCT AAATTCCAAC 
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GAATTAATTA 
GAAGCCCAGC 
ACTGAAAAGA 
CCCCTTTGGT 
GAACAAGAGC 
GCTACATTTA 
GGACTTCCTG 
CCTTCTCCGC 
GAAAAGAAAA 
GGTGTGGAAC 
ACAAAGACAA 
AATCCCTGGC 
CCACGAGAAA 
TCAGATGAAG 
GATGCTAGTC 
CAGAAAAGTG 
TCAAGCCCTC 
AAGAATGTGA 
GCCAAAAAAA 
TCTCAAAAGC 
GATGATTCTG 
AAGGGGGAGA 
TCTGTACGGG 
TAAAATGTGA 
TTACCTGAAG 
CAAGACATCA 
TAGTGACCAT 
TCTTTTGTCT 
CACTTCAGCG 
GATTTAAAAG 
TTATCTGTTT 
GTACAGATAC 
AATTGCTCAT 
TGTCTATAAC 
CAGCTCTTGA 
AATTTCTAAG 
ATGTTATATT 
TAATTTCAAT 
GTAATGTTAT 
AATTTTGTAC 



AAGTT CTGAT 
AAAAGGTTCC 
GTGACTCCGT 
ATTTAACCAA 
TGGACACATT 
TTGAAGAATT 
GGAAAGGGGG 
GTGGTCAAAG 
ATAAAAAGAA 
TAGAAGGCCT 
AGAAACAAAC 
CTGATTCAGA 
CAGAGCCACG 
ATTTCTCAGA 
CACCTAAGAC 
TCGTGTCAGA 
CTGCTACACA 
CAGTGAAGAA 
GGGCTGCCCC 
CTGATCCTGC 
ACTCTAATTT 
GTGATGACTT 
CAAAGAAACC 
GGCGATTATT 
CTCTTAACTT 
AAGTGAAGTA 
CTCATGGGCA 
TTAAAACCTG 
TAAAGCAGTG 
TGTCACTCTT 
TATCTTAGTT 
TCTACTACAC 
GTTCTTCATC 
TTGACACAGT 
CCTGTCCCCT 
AGGACTGGAT 
GATAACCATG 
TTGTAAACTT 
CAACGTTTTT 
TTTAATAAAA 



TCAGAGGGGA 
AGATGAAGAA 
AACAGATTCT 
GGAAAAGAAA 
AAAAAGAAAG 
GGAGGCTGTT 
GAAGGCCAAG 
AGTCATTCCA 
AATTAAGAAT 
AAAACAAAGA 
TACATTGGCA 
AT CAG AT AG G 
GAGAGCAGCA 
TTTTGATGAA 
CAAAACTTCC 
CCTTGAAGCT 
TTTCCCAGAT 
GACAGCAGCA 
AAAAGGAACT 
CAAAACCAAG 
TGAGAAAATT 
CCATATGGAC 
TATAAAGTAC 
TTAAGTAATT 
CCTCCCCTCT 
AAGCCCAAGT 
TTGTTTTCTT 
ATTTTTAAGT 
TGTTTATTAA 
CGTCCTTTTC 
TTATACATAA 
TCAGCCTCTT 
TTCTCAAATC 
CAATAGAATG 
CTGGCTGCCT 
TGCAGAAGAC 
CTCAGCAATG 
TGTTAAGACC 
GTAAATATTT 
TGTTCTAAAC 



TATGATTCGG 3360 

GAAAATGAAG 342 0 

GGACCAACCT 3480 

GATGAACTCT 3540 

AGT CCATCAG 3600 

GAAGCCAAGG 3660 

GGGAAAAAAA 372 0 

CGAATAACCA 3 780 

G AAAAT A CTG 3 840 

TTAGAAAAGA 3900 

TTTAAGCCAA 3 960 

AGCAGTGACG 4020 

ACAAAAACAA 4080 

AAAACTGATG 4140 

CCAAAACTTA 42 00 

GATGATGTTA 4260 

GAAACTGAAA 4320 

AAAAGTCAGT 4380 

AAAAGGGATC 4440 

AATCGCCGCA 4500 

GTTTCGAAAG 4560 

TTTGACTCAG 4620 

CTGGAAGAGT 4680 

ATCTTACCAA 4 740 

GAATTTAGTT 4800 

GTTCTTTAGC 48 60 

CTCTGCTTTG 4 92 0 

TCTTCTGAAC 4 980 

CCATCCACTA 5040 

TACTTTCAGT 5100 

TTTACCATCA 5160 

ATGTGCCAAG 522 0 

ATCAGAGGCC 52 80 

AAG AAAAT T A 5340 

CTGAGT CTGA 5400 

TCGGGGACAA 5460 

AG CTAT TAG A 552 0 

TGTCTACATT 5580 

ACTATGTTTT 5640 
ATTGC 



Seq ID NO: 178 Protein sequence: 
Protein Accession #: NP_001058.1
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MEVSPLQPVN 
MWVYDEDVGI 
NGKGIPWEH 
TASREYKKMF 
RRAYD I AGST 
LTMSEKGFQQ 
WIFVNALIEN 
VQLNKKCSAV 
YGVFPIiRGKI 
DQDQDGSHIK 
STPNHKKWKV 
RKEWLTNFME 
GLKPGQRKVL 
LNLLQPIGQF 
YIPIIPMVLI 
ELAPNQYVIS 
HTDTTVKFW 
DFFELRLKYY 
GYDSDPVKAW 
KDELCRLRNE 
KGKKTQMAEV 
RLEKKQKREP 
ATKTKFTMDL 
ADDVKGSVPIi 
TKRDPALNSG 
DFDSAVAPRA 



11 
I 

ENMQVNKI KK 
NYREVTFVPG 
KVEKMYVPAL 
KQTWMDNMGR 
KDVKVFLNGN 
ISFVNSIATS 
PTFDSQTKEN 
KHNRIKGIPK 
LNVREASHKQ 
GLLINFIHHN 
KYYKGLGTST 
DRRQRKLLGL 
FTCFKRNDKR 
GTRLHGGKDS 
NGAEG I GTGW 
GEVAI LNSTT 
KMTEEKLAEA 
GLRKEWLLGM 
KEAQQKVPDE 
KEQELDTLKR 
LPSPRGQRVI 
GTKTKKQTTL 
DSDEDFSDFD 
SSSPPATHFP 
VSQKPDPAKT 
KSVRAKKPIK 



21 



31 



41 



NEDAKKRLSV 
LYKIFDEILV 
IFGQLLTSSN 
AGEMELKPFN 
KLPVKGFRSY 
KGGRHVDYVA 
MTLQPKSFGS 
LDDANDAGGR 
I MENAE INN I 
WPS LLRHRFL 
SKEAKEYFAD 
PEDYLYGQTT 
E VKVAQL AG S 
AS PRY I FTML 
SCKIPNFDVR 
IEISELPVRT 
ERVGLHKVFK 
LiGAE S AKLNN 
EENEESDNEK 
KSPSDLWKED 
PRITIEMKAE 
AFKP I KKGKK 
EKTDDEDFVP 
DETEITNPVP 
KNRRKRKPST 
YLEESDEDDL 



ERIYQKKTQL 
NAADNKQRDP 
YDDDEKKVTG 
GEDYTCITFQ 
VDMYLKDKLD 
DQ I VTKLVDV 
TCQLSEKFIK 
NSTECTIiILT 
IKIVGLQYKK 
EEFITPIVKV 
MKRHRIQFKY 
TYLTYNDFIN 
VAEMSSYHHG 
SSLARLLFPP 
EIVNNIRRLM 
WTQTYKEQVL 
LQTSLTCNSM 
QARFILEKID 
ETEKSDSVTD 
LATFIEELEA 
AEKKNKKK I K 
RNPWPDSESD 
SDASPPKTKT 
KKNVTVKKTA 
SDDSDSNFEK 
F 



EHILLRPDTY 
KMSCIRVTID 
GRNGYGAKLC 
PDLSKFKMQS 
ETGNSLKVIH 
VKKKNKGGVA 
AAIGCGIVES 
EGDSAKTLAV 
NYEDEDSLKT 
SKNKQEMAFY 
SGPEDDAAIS 
KELILFSNSD 
EMSLMMTIIN 
KDDHTLKFLY 
DGEEPLPMLP 
EPMLNGTEKT 
VLFDHVGCLK 
GKI I IENKPK 
SGPTFNYLLD 
VEAKEKQDEQ 
NENTEGSPQE 
RSSDESNFDV 
SPKLSNKELK 
AKSQSSTSTT 
IVSKAVTSKK 



51 
I 

IGSVELVTQQ 60 

PENNLISIWN 120 

NIFSTKFTVE 180 

LDKDIVALMV 240 

EQVNHRWEVC 3 00 

VKAHQVKNHM 3 60 

ILNWVKFKAQ 42 0 

SGLGWGRDK 480 

LRYGKIMIMT 540 

SLPEFEEWKS 60 0 

LAFSKKQIDD 660 

NERSIPSMVD 72 0 

LAQNFVGSNN 780 

DDNQRVEPEW 840 

SYKNFKGTIE 90 0 

PPLITDYREY 960 

KYDTVLDILR 102 0 

KELIKVLIQR 10 80 

MPLWYLTKEK 1140 

VGLPGKGGKA 12 00 

DGVEIiEGLKQ 1260 

PPRETEPRRA 13 20 

PQKSWSDLE 13 80 

GAKKRAAPKG 1440 

SKGESDDFHM 1500 



75 



80 



85 



Seq ID NO: 179 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 148-7095 



I 



CACACATACG 
CAAAAAAAAC 
CGGCGAGGGG 
CAGCTCCTCT 
CTTGTTGAAG 
AAATATCCAA 
CAAGTAAATG 



11 
I 

CACGCACGAT 
ATTTCCTTCG 
CCGCAGACCG 
GTGTTTGCCG 
AGATTGGCTG 
CATGTAATAG 
TGAATCTTAA 



21 
I 

CTCACTTCGA 
CTCCCCCTCC 
TCTGGAAATG 
CCTGGATTGG 
GTCCTATACA 
CCCAAAACAA 
GAAACTTAAA 



31 
1 

TCTATACACT 
CTCTCCACTC 
CGAATCCTAA 
GCTAATGGAT 
GGAGCACTGA 
TCTCCTATCA 
TTTCAGGGTT 



41 
I 

GGAGGATTAA 
TGAGAAGCAG 
AGCGTTTCCT 
ACTACAGACA 
ATCAAAAAAA 
ATATTGATGA 
GGGATAAAAC 



51 
I 

AACAAACAAA 60 

AGGAGCCGCA 12 0 

CGCTTGCATT 180 

ACAGAGAAAA 240 

TTGGGGAAAG 3 00 

AGATCTTACA 3 60 

AT CAT TGGAA 42 0 
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AACACATTCA TTCATAACAC TGGGAAAACA 
GTCAGCGGAG GAGTTTCAGA AATGGTGTTT 
AAATGCAATA TGTCAT CTGA TGGATCAGAG 
GAGATGCAAA TCTACTGCTT TGATGCGGAC 
5 GGAAAAGGGA AGTTAAGAGC TTTATCCATT 

GATT TCAAAG CGATTATTGA TGGAGTCGAA 
TTAGATCCAT TCATACTGTT GAACCTTCTG 
AATGGCTCAT TGACATCTCC TCCCTGCACA 
ACAGTTAGCA TCTCTGAAAG CCAGTTGGCT 

10 TCTGGTTATG TCATGCTGAT GGACTACTTA 

TTCT CTAGAC AGGTGTTTTC CTCATACACT 
AGTTCAGAAC CAGAAAATGT TCAGGCTGAC 
TGGGAAAGAC CTCGAGTCGT TTATGATACC 
CAGTTGGATG GAGAGGACCA AACCAAGCAT 

15 GGTGCTATTC TCAATAATTT GCTACCCAAT 

TGCACTAATG GCTTATATGG AAAATACAGC 
AATCCTGAAC TTGATCTTTT CCCTGAATTA 
GAAGAGGGAA AAGACATTGA AGAAGGCGCT 
AACCAAATCA GGAAAAAGGA ACCCCAGATT 

20 ACGAAATACA ATGAAGCCAA GACTAACCGA 

AAGGGTGATG TTCCCAATAC ATCTTTAAAT 
ACAGAAAAAG ATATTTCCTT GACTTCTCAG 
GAAGGTACTT CAGCCTCTTT AAATGATGGC 
AACTTGTCGG GGACTGCAGA ATCCTTAAAT 

25 AGTTTATTGA CCAGTTTCAA GCTTGATACT 

GCAACTTCTG CTATCCCATT CATCTCTGAG 
GAAAACCCAG AGACAATAAC ATATGATGTC 
GAAGATTCAA CTT CAT CAGG TTCAGAAGAA 
GTGTGGTTTC CTAGCTCTAC AGACATAACA 

30 AGCTTTCTCC AGACTAATTA CACTGAGATA 

TCCTTTTCTG CAGGCCCAGT GATGT CACAG 
CATTATTCTA CCTTTGCCTA CTTCCCAACT 
TCCAGACAAC AGGATTTGGT CTCCACGGTC 
GTATACAATG GTGAGACACC TCTTCAACCT 

35 ACCCCTTTGT TGCTTGACAA TCAGATCCTC 

TCGGCCTTGC ATGCTACGCC TGTATTTCCC 
TCTTCCTATG ATGGTGCACC TTTGCTTCCA 
TTTCGCCATC TGCATACAGT TTCTCAAATC 
GATAAGGTGC CCTTGCATGC TTCTCTGCCA 

40 AGCCTTGCTC AGTATTCTGA TGTGCTGTCC 

TTTGGTAGTG AATCTGGTGT TCTTTATAAA 
AG C AGTGATG CCATGATGCA TGCACGTTCT 
GATAATGAGG GCTCCCAACA CATCTTCACT 
GAT TCTGTGG GTGTAACTTA TCAGGGTTCC 

45 CCTAAGTCTT CGTTAATAAC CCCAACTGCA 

GGTGATGGGG AATGGTCTGG AGCCTCTTCT 
GGGCTGACAG CCCTTAACAT TTCTTCACCT 
TCTGTGTTTG GTGATGATAA TAAGGCGCTT 
ACTGAACTGC AAATTCCTTC TTTCAATGAG 

50 CCCAACATGT ATGATAATGT AAATAAGTTG 

ATTTCTAGCA CCAAGGGCAT GTTT CCAGGG 
GATCATGAGA TTAGTCAAGT TCCAGAAAAT 
TCTCAAGCAT CTGGTGACAC TTCGCTTAAA 
TCCTCTGACC CTGCTTCTAG TGAAATGTTA 

55 ACCTCAGCTT CTTTTAGTAC TGAAGTATTG 

GACACCTTGC TTAAAACTGT TCTTCCAGCT 
CCCAAAGTTG ATAAAATTAG TTCTACAATG 
AGTGAAAACA TGCTGCACTC TACATCTGTA 
ATGCACTCTG CTTCACTTCA AGGTTTGACC 

60 GTTTTGTTAA AAAGTGAAAG TTCCCACCAA 

TTGTT CCAAA CGGCCAATTT GGAGATTAAC 
TTTGCTACAC CTGTTTTATC AATTGATGAA 
CATTCCGATG AAATTTTAAC CTCCACCAAA 
ATTCCAACAG TTGCTTCTGA TACATTTGTA 

65 GGGCATGTTG CCATTACAGC TGTTTCTCCC 

TTGCTGTTTC CTTCTAAGGC AACTTCTGAG 
TTAGTGGGTG GTGGTGAAGA TGGTGACACT 
AGAGGTAGTG ATGGCTTATC CATT CATAAG 
CAGGAAAAGG TAATGAATGA TTCAGACACC 

70 CCAATCTCAT ACTC ACT AT C TGAGAATTCT 

TCAGACAGTC AAACTGGTAT GGACAGAAGT 
TCCCAAAAGC ACAATGATGG AAAAGAGGAA 
CCTCTCAGCC CTGAATCTAA AGCATGGGCA 
GGGCAAGGTA CCTCAGATAG CCTTAATGAG 

75 GACACTAATG AAAAAGATGC TGATGGGATC 

GGATTCCCAC AGTCCCCAAC AT CATCTGTT 
TCAGAGGCAG AGGCCAGTAA TAGTAGCCAT 
GAATCCGAGA AGAAGGCAGT TATACCCCTT 
CTAGTGGTTC TTGTGGGTAT TCTCATCTAC 

80 TACTTAGAGG ACAGTACATC CCCTAGAGTT 

ATTTCAGATG ATGTCGGAGC AATTCCAATA 
CATGCAAGTA GTGGGTTTAC TGAAGAATTT 
CAGAGCTGTA CTGTTGACTT AGGTATTACA 
CACAAGAATC GATACATAAA TAT CGTTGCC 

85 CTTGCTGAAA AGGATGGCAA ACTGACTGAT 

AACAGACCAA AAGCTTATAT TGCTGCCCAA 
TGGAGAATGA TATGGGAACA TAATGTGGAA 



GTGGAAATTA ATCTCACTAA TGACTACCGT 480 
AAAGCAAGCA AGATAACTTT TCACTGGGGA 540 
CATAGTTTAG AAGGACAAAA ATTTCCACTT 60 0 
CGATTTTCAA GTTTTGAGGA AGCAGTCAAA 660 
TTGTTTGAGG TTGGGACAGA AGAAAATTTG 720 
AGTGTTAGTC GTTTTGGGAA GCAGGCTGCT 780 
CCAAACTCAA CTGACAAGTA TTACATTTAC 840 
GACACAGTTG ACTGGATTGT TTTTAAAGAT 900 
GTTTTTTGTG AAGTTCTTAC AATGCAACAA 960 

CAAAACAATT TTCGAGAGCA ACAGTACAAG 102 0 

GGAAAGGAAG AGATTCATGA AGCAGTTTGT 1080 

CCAGAGAATT ATACCAGCCT TCTTGTTACA 1140 

ATGATTGAGA AGTTTGCAGT TTTGTACCAG 12 00 

GAATTTTTGA CAGATGGCTA TCAAGACTTG 12 60 

ATGAGTTATG TT CTT CAG AT AGTAGCCATA 132 0 

GACCAACTGA TTGTCGACAT GCCTACTGAT 13 80 

ATTGGAACTG AAGAAATAAT CAAGGAGGAG 1440 

ATTGTGAATC CTGGTAGAGA CAGTGCTACA 1500 

TCTACCACAA CACACTACAA TCGCATAGGG 1560 

TCCCCAACAA GAGGAAGTGA ATTCTCTGGA 162 0 

TCCACTTCCC AACCAGTCAC TAAATTAGCC 1680 

ACTGTGACTG AACTGCCACC TCACACTGTG 1740 

TCTAAAACTG TTCTTAGATC TCCACATATG 180 0 

ACAGTTTCTA TAACAGAATA TGAGGAGGAG 1860 

GGAGCTGAAG ATTCTTCAGG CTCCAGTCCC 1920 

AACATAT CCC AAGGGTATAT ATTTTCCTCC 1980 

CTTATACCAG AATCTGCTAG AAATGCTTCC 2040 

TCACTAAAGG ATCCTTCTAT GGAGGGAAAT 210 0 

GCACAGCCCG ATGTTGGATC AGGCAGAGAG 2160 

CGTGTTGATG AAT CTGAGAA GACAACCAAG 222 0 

GGTCCCTCAG TTACAGATCT GGAAATGCCA 22 80 

GAGGTAACAC CTCATGCTTT TACCCCATCC 2340 

AACGTGGTAT ACTCGCAGAC AACCCAACCG 240 0 

TCCTACAGTA GTGAAGTCTT TCCTCTAGTC 2460 

AACACTACCC CTGCTGCTTC AAGTAGTGAT 2520 

AGTGTCGATG TGTCATTTGA ATCCATCCTG 2580 

TTTTCCTCTG CTTCCTTCAG TAGTGAATTG 2 640 

CTTCCACAAG TTACTTCAGC TACCGAGAGT 2700 

GTGGCTGGGG GTGATTTGCT AT T AGAGCCC 2 760 

ACT ACT CATG CTGCTTCAGA GACGCTGGAA 2 82 0 

ACGCTTATGT TTTCTCAAGT TGAACCACCC 2 880 

TCAGGGCCTG AACCTTCTTA TGCCTTGTCT 2 940 

GTTT CTTACA GTTCTGCAAT ACCTGTGCAT 3000 

TTATTTAGCG GCCCTAGCCA TATACCAATA 3 0 60 

TCATTACTGC AGCCTACTCA TGCCCTCTCT 312 0 

GATAGTGAAT TTCTTTTACC TGACACAGAT 3180 

GTTTCTGTAG CTGAATTTAC ATATACAACA 3 240 

TCTAAAAGTG AAATAATATA TGGAAATGAG 33 0 0 

ATGGTTTACC CTTCTGAAAG CACAGTCATG 33 60 

AATGCGTCTT TACAAGAAAC CTCTGTTTCC 342 0 

TCCCTTGCTC ATACCACCAC TAAGGTTTTT 3480 

AACTTTTCAG TTCAACCTAC ACATACTGTC 3540 

CCTGTGCTTA GTGCAAACTC AGAGCCAGCA 3 60 0 

TCTCCTTCAA CTCAGCTCTT ATTTTATGAG 3 660 

CTACAACCTT CCTTTCAGGC TTCTGATGTT 3 72 0 

GTGCCCAGTG ATCCAATATT GGTTGAAACC 3 780 

TTGCATCTCA TTGTATCAAA TTCTGCTTCA 3 840 

CCAGTTTTTG ATGTGTCGCC TACTTCTCAT 3 900 

ATTTCCTATG CAAGTGAGAA ATATGAACCA 3 960 

GTGGTACCTT CTTTGTACAG TAATGATGAG 402 0 

CAGGCCCATC CCCCAAAAGG AAGGCATGTA 4080 

CCATTAAATA CACTAATAAA TAAG CT TATA 4140 

AGTTCTGTTA CTGGTAAGGT ATTTGCTGGT 42 00 

TCTACTGATC ATTCTGTTCC TATAGGAAAT 42 60 

CACAGAGATG GTTCTGTAAC CTCAACAAAG 432 0 

CTGAGT CAT A GTGCCAAATC TGATGCCGGT 43 80 

GATGATGATG GTGATGATGA TGATGATGAC 4440 

TGTATGTCAT GCTCATCCTA TAGAGAATCA 4500 

CACGAAAACA GTCTTATGGA TCAGAATAAT 4560 

GAAGAAGATA ATAGAGTCAC AAGTGTATCC 4620 

CCTGGTAAAT CACCATCAGC AAATGGGCTA 4680 

AATGACATTC AGACTGGTAG TGCTCTGCTT 4740 

GTTCTGACAA GTGATGAAGA AAGTGGATCA 4 800 

AATGAGACTT CCACAGATTT CAGTTTTGCA 4 860 

CTGGCAGCAG GTG ACT CAGA AATAACTCCT 4920 

ACTAGCGAGA ACTCAGAAGT GTTCCACGTT 4980 

GAGTCTCGTA TTGGTCTAGC TGAGGGGTTG 5040 

GTGATCGTGT CAGCCCTGAC TTTTATCTGT 5100 

TGGAGGAAAT GCTTCCAGAC TGCACACTTT 5160 

AT AT CCAC AC CTCCAACACC TATCTTTCCA 5220 

AAGCACTTTC CAAAGCATGT TGCAGATTTA 52 80 

GAGACACTGA AAGAGTTTTA CCAGGAAGTG 5340 

GCAGACAGCT CCAACCACCC AGACAACAAG 540 0 

TATGATCATA GCAGGGTTAA G C TAG CACAG 5460 

TATATCAATG CCAATTATGT TGATGGCTAC 5520 

GGCCCACTGA AATCCACAGC TGAAGATTTC 5580 

GTTATTGTCA TGATAACAAA CCTCGTGGAG 5640 
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AAAGGAAGGA GAAAATGTGA 
TTTCTGGTCA CTCAGAAGAG 
CTAAGAAACA CAAAAATAAA 
A CACAGT AT C ACTACACGCA 
CTGACCTTTG TGAGAAAGGC 
CACTGCAGTG CTGGAGTTGG 
CAGATTCAAC ACGAAGGAAC 
AGAAATTATT TGGTACAAAC 
GCCATACTTA GTAAAGAAAC 
CTCCTCATTC CTGGACCAGC 
CAGTCAAATA TACAGCAGAG 
AATCGAACTT CTTCTATCAT 
GGAGAAGGCA CAGACTACAT 
TTCATCATTA CCCAGCACCC 
GACCATAATG CCCAACTGGT 
TTTGTTTACT GGCCAAATAA 
ATGGCTGAAG AACACAAATG 
TTAGAAGCTA CACAGGATGA 
CCAAAT C CAG ATAGCCCCAT 
GCTGCCAATA GGGATGGGCC 
ACTTTCTGTG CTCTGACAAC 
TACCAGGTAG CCAAGATGAT 
TATCAGTTTC TCTACAAAGT 
TCCACCTCTC TGGACAGTAA 
GAGTCTTTAG TTTAACACAG 
TTCCTAAAAT TAGGCAGGAA 
GACAGTAACT TTCATGACAT 
CTTTTTGCAA GACTTGTAAT 
TATTTCTAAG AATGGAATTG 
T T T AT AG AGG TTAGGAATTC 
GCTGTATTTG TAGCAATTAT 
AAATAAAACA CTCTTCCATA 
AGAAATAATC TGTTACTTAT 
TTTATAATTG TAGATTTTTA 
GTTTAGT TTA ATGACGTAGT 
TTGTGTTACC T AAGT CAT T A 
GAAATACCTT CATTTTGAAA 
AATGGTTTTT ATCCAAGGAA 
AAAAAAAAAA AAAAAAAAAA 



TCAGTACTGG 
TGTGCAAGTG 
AAAGGGCTCC 
GTGGCCTGAC 
AGCCTATGCC 
AAGAACAGGC 
TGTCAACATA 
TGAGGAGCAA 
TGAGGTGCTG 
AGGCAAAACA 
TGACTATTCT 
CCCTGTGGAA 
CAATGCCTCC 
TCTCCTTCAT 
GGTTATGATT 
AGATGAGCCT 
TCTATCTAAT 
TTATGTACTT 
TAGTAAAACT 
TATGATTGTT 
CCTTATGCAC 
CAAT CTGATG 
GAT CCTCAGC 
TGGTGCAGCA 
AAAGGGGTGG 
AATCAGTCTA 
AGGATTCTGC 
TTACTTATTA 
TGGTATTTTT 
CAAACTACAG 
CAGGTTTGCT 
TGATATTCAA 
TGTAAATACT 
TATTTTACTA 
TCATTAGCTG 
ACTTTGTTTC 
GAAGTTTTTA 
TTGCAAAAAT 
AAAA 



CCTGCCGATG 
CTTGCCTATT 
CAGAAAGGAA 
ATGGGAGTAC 
AAGCGCCATG 
ACATATATTG 
TTTGGCTTCT 
TATGTCTTCA 
GACAGT CATA 
AAGCTAGAGA 
GCAGCCCTAA 
AGATCAAGGG 
TATATCATGG 
ACCATCAAGG 
CCTGATGGCC 
ATAAATTGTG 
GAGGAAAAAC 
GAAGTGAGGC 
TTTGAACTTA 
CATGATGAGC 
CAACTAGAAA 
AGGCCAGGAG 
CTTGTGAGCA 
TTGCCTGATG 
GGGGACTCAC 
GTTCTGTTAT 
CGCCAAATTT 
TGTTTGAACT 
TTCTGTATTG 
AAAATGTTTG 
AGAAATATAA 
CATTTTACAA 
GCCCTAGTGT 
CTGAGTCAAG 
GTCTTACTCT 
AGCATGTAAT 
TGAGAATAAC 
AAATATAAAT 



GGAGTGAGGA 
ATACTGTGAG 
GACCCAGTGG 
CAGAGTACTC 
CAGTGGGGCC 
TGCTAGACAG 
TAAAACACAT 
TTCATGATAC 
TTCATGCCTA 
AACAATTCCA 
AGCAATGCAA 
TTGGCATTTC 
GCTATTACCA 
ATTTCTGGAG 
AAAACATGGC 
AGAG CTTTAA 
TTATAATTCA 
ACTTTCAGTG 
TAAGTGTTAT 
ATGGAGGAGT 
AAGAAAATTC 
TCTTTGCTGA 
CAAGGCAGGA 
GAAATATAGC 
ATCTGAGCAT 
CTGTTGATTT 
ATATCATTAA 
AAAATGATTG 
ATTTTAACAG 
TTTTTAGTGT 
CTTTTAATAC 
CTGCAGTATT 
CTCCATGGAC 
TTTTCTAGTT 
ACCAGTTTTC 
TTTAACTTTT 
ACCTTACCAA 
ATTGCCATTA 



GTACGGGAAC 5700 

GAATTTTACT 5760 

ACGTGTGGTC 5820 

CCTGCCAGTG 5880 

TGTTGTCGTC 5940 

TATGTTGCAG 6000 

CCGTTCACAA 6060 

ACTGGTTGAG 612 0 

TGTTAATGCA 6180 

GCTCCTGAGC 6240 

CAGGG AAAAG 6300 

ATCCCTGAGT 63 60 

GAGCAATGAA 6420 

GATGATATGG 6480 

AGAAGATGAA 6540 

GGT CACTCTT 6600 

GGACTTTATC 6660 

TCCTAAATGG 6720 

AAAAG AAGAA 6780 

GACGGCAGGA 6840 

CGTGGATGTT 6900 

CATTGAGCAG 6960 

AGAGAATCCA 7020 

TGAGAGCTTA 70 80 

TGTTTTCCTC 7140 

CCCATCACCT 7200 

CAATGTGTGC 7260 

AATTTTACAG 7320 

AAAATTTCAA 7380 

CAAATTTTTA 7440 

AGTAGCCTGT 7500 

CACCTAAAGT 7560 

CAAATTTATA 7620 

CTGTGTAATT 7 680 

TGACATTGTA 7740 

GTGGAAAATA 7800 

ACATTGTTCA 7860 

AAAAAAAAAA 792 0 
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Seq ID NO: 180 Protein sequence: 
Protein Accession #: Eos sequence 



85 



1 

1 

MRILKRFLAC 
QSPINIDEDL 
FKASKITFHW 
ILFEVGTEEN 
TDTVDWIVFK 
TGKEEIHEAV 
HEFLTDGYQD 
LIGTEEI IKE 
RSPTRGSEFS 
GSKTVLRSPH 
ENISQGYIFS 
TAQPDVGSGR 
TEVTPHAFTP 
LNTTPAASSS 
ILPQVTSATE 
KTLMFSQVEP 
SLFSGPSHIP 
PVSVAEFTYT 
LNASLQETSV 
KPVLSANSEP 
AVPSDPILVE 
TISYASEKYE 
EPLNTLINKL 
PHRDGSVTST 
KCMSCSSYRE 
SPGKSPSANG 
ENETSTDFSF 
HESRIGLAEG 
VISTPPTPIF 
TADSSNHPDN 
QGPLKSTAED 
VLAYYTVRNF 
AKRHAVGPW 
QYVFIHDTLV 
SAALKQCNRE 
HTIKDFWRMI 
NEEKLIIQDF 
VHDEHGGVTA 
SLVSTRQEEN 



11 
1 

IQLLCVCRLD 
TQVNVNLKKL 
GKCNMSSDGS 
LDFKAI IDGV 
DTVSISESQL 
CSSEPENVQA 
LGAILNNLLP 
EEEGKDIEEG 
GKGDVPNTSL 
MNLSGTAESL 
SENPETITYD 
ESFLQTNYTE 
SSRQQDLVST 
DSALHATPVF 
SDKVPLHASL 
PSSDAMMHAR 
IPKSSLITPT 
TSVFGDDNKA 
SISSTKGMFP 
ASSDPASSEM 
TPKVDKISST 
PVLLKSESSH 
IHSDEILTST 
KLLFPSKATS 
SQEKVMNDSD 
LSQKHNDGKE 
ADTNEKDADG 
LESEKKAVIP 
PISDDVGAIP 
KHKNRYINIV 
FWRMIWEHNV 
TLRNTKIKKG 
VHCSAGVGRT 
EAILSKETEV 
KNRTSSIIPV 
WDHNAQLWM 
ILEATQDDYV 
GTFCALTTLM 
PSTSLDSNGA 



21 
1 

WANGYYRQQR 
KFQGWDKTSL 
EHSLEGQKFP 
ESVSRFGKQA 
AVFCEVLTMQ 
DPENYTSLLV 
NMSYVLQIVA 
AIVNPGRDSA 
N ST SQPVTKIi 
NTVSITEYEE 
VLIPESARNA 
IRVDESEKTT 
VNWYSQTTQ 
PSVDVSFESI 
PVAGGDLLLE 
SSGPEPSYAL 
ASLLQPTHAL 
LSKSEIIYGN 
GSLAHTTTKV 
LSPSTOLLFY 
MLHLIVSNSA 
QWPSLYSND 
KSSVTGKVFA 
ELSHSAKSDA 
THENSLMDQN 
ENDIQTGSAL 
ILAAGDSEIT 
LVIVSALTFI 
IKHFPKHVAD 
AYDHSRVKLA 
EVIVMITNLV 
SQKGRPSGRV 
GTYIVLDSML 
LDSHIHAYVN 
ERSRVGISSL 
I PDGQNMAED 
LEVRHFQCPK 
HQLEKENSVD 
ALPDGNIAES 



31 
1 

KLVEEIGWSY 

ENTFIHNTGK 

LEMQIYCFDA 

ALDPFILLNL 

QSGYVMLMDY 

TWERPRWYD 

ICTNGLYGKY 

TNQIRKKEPQ 

ATEKDISLTS 

ESLLTSFKLD 

SEDSTSSGSE 

KSFSAGPVMS 

PVYNGETPLQ 

LSSYDGAPLL 

PSLAQYSDVL 

SDNEGSQHIF 

SGDGEWSGAS 

ETELQIPSFN 

FDHEISQVPE 

ETSASFSTEV 

SSENMLHSTS 

ELFQTANLEI 

GIPTVASDTF 

GLVGGGEDGD 

NPISYSLSEN 

LPLSPESKAW 

PGFPQSPTSS 

CLWLVGILI 

LHASSGFTEE 

QLAEKDGKLT 

EKGRRKCDQY 

VTQYHYTQWP 

QQIQHEGTVN 

ALL I PGP AGK 

SGEGTDYINA 

EFVYWPNKDE 

WPNPDSPISK 

VYQVAKMINL 

LESLV 



41 

1 

TGALNQKNWG 

TVEINLTNDY 

DRFSSFEEAV 

LPNSTDKYYI 

LQNNFREQQY 

TMIEKFAVLY 

SDQLIVDMPT 

ISTTTHYNRI 

QTVTELPPHT 

TGAEDSSGSS 

ESLKDPSMEG 

QGPSVTDLEM 

PSYSSEVFPL 

PFSSASFSSE 

STTHAASETL 

TVSYSSAIPV 

SDSEFLLPDT 

EMVYPSESTV 

NNFSVQPTHT 

LLQPSFQASD 

VPVFDVSPTS 

NQAHPPKGRH 

VSTDHSVPIG 

TDDDGDDDDD 

SEEDNRVTSV 

AVLTSDEESG 

VTSENSEVFH 

YWRKCFQTAH 

FETLKEFYQE 

DYINANYVDG 

WPADGSEEYG 

DMGVPEYSLP 

IFGFLKHIRS 

TKLEKQFQLL 

SYIMGYYQSN 

PINCESFKVT 

TFELISVIKE 

MRPGVFADIE 



51 
I 

KKYPTCNSPK 60 

RVSGGVSEMV 12 0 

KGKGKLRALS 180 

YNGSLTSPPC 24 0 

KFSRQVFSSY 300 

QQLDGEDQTK 360 

DNPELDLFPE 420 

GTKYNEAKTN 480 

VEGTSASLND 540 

PATSAIPFIS 600 

NVWFPSSTDI 660 

PHYSTFAYFP 720 

VTPLLLDNQI 780 

LFRHLHTVSQ 840 

EFGSE SGVLY 900 

HDSVGVTYQG 960 

DGLTALNISS 1020 

MPNMYDNVNK 1080 

VSQASGDTSL 1140 

VDTLLKTVLP 12 00 

HMHSASLQGL 1260 

VFATPVLSID 1320 

NGHVAITAVS 13 80 

DRGSDGLSIH 1440 

SSDSQTGMDR 1500 

SGQGTSDSLN 1560 

VSEAEASNSS 162 0 

FYLEDSTSPR 1680 

VQSCTVDLGI 1740 

YNRPKAY I AA 18 00 

NFLVTQKSVQ 1860 

VLTFVRKAAY 1920 

QRNYLVQTEE 1980 

SQSNIQQSDY 2040 

EFIITQHPLL 2100 

LMAEEHKCLS 2160 

EAANRDGPMI 2220 

QYQFLYKVIL 22 80 



Seq ID NO: 181 DNA sequence 

Nucleic Acid Accession #: Eos sequence



257 



WO 02/086443 

Coding sequence: 148-4518 



PCT/US02/12476 



1 11 21 31 41 51 

| | | | | |

D CACACATACG CACGCACGAT CTCACTTCGA TCTATACACT GGAGGATTAA AACAAACAAA 60 

CAAAAAAAAC ATTTCCTTCG CTCCCCCTCC CTCTCCACTC TGAGAAGCAG AGGAGCCGCA 12 0 

CGGCGAGGGG CCGCAGACCG TCTGGAAATG CGAATCCTAA AGCGTTTCCT CGCTTGCATT 180 

CAGCTCCTCT GTGTTTGCCG CCTGGATTGG GCTAATGGAT ACTACAGACA ACAGAGAAAA 240 

CTTGTTGAAG AGATTGGCTG GTCCTATACA GGAGCACTGA ATCAAAAAAA TTGGGGAAAG 300 

10 AAATATCCAA CATGTAATAG CCCAAAACAA TCTCCTATCA ATATTGATGA AGATCTTACA 3 60 

CAAGTAAATG TGAATCTTAA GAAACTTAAA TTTCAGGGTT GGGATAAAAC ATCATTGGAA 42 0 

AACACATTCA TTCATAACAC TGGGAAAACA GTGGAAATTA ATCTCACTAA TGACTACCGT 480 

GTCAGCGGAG GAGTTT CAG A AATGGTGTTT AAAGCAAGCA AGATAACTTT TCACTGGGGA 540 

AAATGCAATA TGTCATCTGA TGGATCAGAG CATAGTTTAG AAGGACAAAA ATTTCCACTT 600 

15 GAGATGCAAA TCTACTGCTT TGATGCGGAC CGATTTTCAA GTTTTGAGGA AGCAGTCAAA 660 

GGAAAAGGGA AGTTAAGAGC TTTATCCATT TTGTTTGAGG TTGGGACAGA AGAAAATTTG 72 0 

GATTTCAAAG CGATTATTGA TGGAGT CGAA AGTGT TAGTC GTTTTGGGAA GCAGGCTGCT 780 

TTAGATCCAT TCATACTGTT GAACCTTCTG CCAAACTCAA CTGACAAGTA TTACATTTAC 840 

AATGGCTCAT TGACATCTCC TCCCTGCACA GACACAGTTG ACTGGATTGT TTTTAAAGAT 90 0 

20 ACAGT TAG CA TCTCTGAAAG CCAGTTGGCT GTTTTTTGTG AAGTTCTTAC AATGCAACAA 960 

TCTGGTTATG TCATGCTGAT GGACTACTTA CAAAACAATT TTCGAGAGCA ACAGTACAAG 102 0 

TTCTCTAGAC AGGTGTTTTC CTCATACACT GGAAAGGAAG AGATTCATGA AGCAGTTTGT 1080 

AGTTCAGAAC CAGAAAATGT TCAGGCTGAC CCAGAGAATT ATACCAGCCT TCTTGTTACA 1140 

TGGGAAAGAC CTCGAGTCGT TTATGATACC ATGATTGAGA AGTTTGCAGT TTTGTACCAG 12 00 

25 CAGTTGGATG GAGAGGACCA AACCAAGCAT GAATTTTTGA CAGATGGCTA TCAAGACTTG 1260 

GGTGCTATTC TCAATAATTT GCTACCCAAT ATGAGTTATG TTCTTCAGAT AGTAGCCATA 1320 

TGCACTAATG GCTTATATGG AAAATACAGC GACCAACTGA TTGTCGACAT GCCTACTGAT 13 80 

AATCCTGAAC TTGATCTTTT CCCTGAATTA ATTGGAACTG AAGAAATAAT CAAGGAGGAG 144 0 

GAAGAGGGAA AAGACATTGA AGAAGGCGCT ATTGTGAATC CTGGTAGAGA CAGTGCTACA 1500 

30 AACCAAATCA GGAAAAAGGA ACCCCAGATT TCTACCACAA CACACTACAA TCGCATAGGG 1560 

ACGAAATACA ATGAAGCCAA GACTAACCGA TCCCCAACAA GAGGAAGTGA ATTCTCTGGA 162 0 

AAGGGTGATG TTCCCAATAC ATCTTTAAAT TCCACTTCCC AACCAGTCAC TAAATTAGCC 1680 

ACAGAAAAAG ATATTTCCTT GACTTCTCAG ACTGTGACTG AACTGCCACC TCACACTGTG 1740 

GAAGGTACTT CAGCCTCTTT AAATGATGGC TCTAAAACTG TTCTTAGATC TCCACATATG * 180 0 

35 AACTTGTCGG GGACTGCAGA ATCCTTAAAT ACAGTTTCTA TAACAGAATA TGAGGAGGAG 1860 

AGTTTATTGA CCAGTTTCAA GCTTGATACT GGAGCTGAAG ATTCTTCAGG CTCCAGTCCC 192 0 

GCAACTTCTG CTATCCCATT CATCTCTGAG AACATATCCC AAGGGTATAT ATTTTCCTCC 198 0 

GAAAACCCAG AGACAATAAC ATATGATGTC CTTATACCAG AATCTGCTAG AAATGCTTCC 2 040 

GAAGATTCAA CTTCATCAGG TTCAGAAGAA TCACTAAAGG ATCCTTCTAT GGAGGGAAAT 2100 

40 GTGTGGTTTC CTAGCTCTAC AGACATAACA GCACAGCCCG ATGTTGGATC AGGCAGAGAG 2160 

AGCTTTCTCC AGACTAATTA CACTGAGATA CGTGTTGATG AATCTGAGAA GACAACCAAG 222 0 

TCCTTTTCTG CAGGCCCAGT GATGTCACAG GGTCCCTCAG TTACAGATCT GGAAATGCCA 2280 

CATTATTCTA CCTTTGCCTA CTTCCCAACT GAGGTAACAC CTCATGCTTT TACCCCATCC 2340 

TCCAGACAAC AGGATTTGGT CTCCACGGTC AACGTGGTAT ACTCGCAGAC AACCCAACCG 2400 

45 GTATACAATG CAGAGGCCAG TAATAGTAGC CATGAGTCTC GTATTGGTCT AGCTGAGGGG 2460 

TTGGAATCCG AGAAGAAGGC AGTTATACCC CTTGTGATCG TGTCAGCCCT GACTTTTATC 2520 

TGTCTAGTGG TTCTTGTGGG TATTCTCATC TACTGGAGGA AATGCTTCCA GACTGCACAC 2580 

TTTTACTTAG AGGACAGTAC ATCCCCTAGA GTTATATCCA CACCTCCAAC ACCTATCTTT 2 640 

CCAATTTCAG ATGATGTCGG AGCAATTCCA ATAAAGCACT TTCCAAAGCA TGTTGCAGAT 270 0 

50 TTACATGCAA GTAGTGGGTT TACTGAAGAA TTTGAGACAC TGAAAGAGTT TTACCAGGAA 2 760 

GTGCAGAGCT GTACTGTTGA CTTAGGTATT ACAGCAGACA GCTCCAACCA CCCAGACAAC 282 0 

AAGCACAAGA ATCGATACAT AAATATCGTT GCCTATGATC ATAGCAGGGT TAAGCTAGCA 2 880 

CAGCTTGCTG AAAAGGATGG CAAACTGACT GATTATATCA ATGCCAATTA TGTTGATGGC 2940 

TACAACAGAC CAAAAGCTTA TATTGCTGCC CAAGGCCCAC TGAAATCCAC AGCTGAAGAT 3 000 

55 TTCTGGAGAA TGATATGGGA ACATAATGTG GAAGTTATTG TCATGATAAC AAACCTCGTG 30 60 

GAGAAAGGAA GGAGAAAATG TGATCAGTAC TGGCCTGCCG ATGGGAGTGA GGAGTACGGG 312 0 

AACTTTCTGG TCACTCAGAA GAGTGTGCAA GTGCTTGCCT ATTATACTGT GAGGAATTTT 3180 

AGTCTAAGAA ACACAAAAAT AAAAAAGGGC TCCCAGAAAG GAAGACCCAG TGGACGTGTG 3240 

GTCACACAGT ATCACTACAC GCAGTGGCCT GACATGGGAG TACCAGAGTA CTCCCTGCCA 33 00 

60 GTGCTGACCT TTGTGAGAAA GGCAGCCTAT GCCAAGCGCC ATGCAGTGGG GCCTGTTGTC 3360 

GTCCACTGCA GTGCTGGAGT TGGAAGAACA GGCACATATA TTGTGCTAGA CAGTATGTTG 3420 

CAGCAGATTC AACACGAAGG AACTGTCAAC ATATTTGGCT TCTTAAAACA CATCCGTTCA 3480 

CAAAGAAATT ATTTGGTACA AACTGAGGAG CAATATGTCT TCATTCATGA TACACTGGTT 3 54 0 

GAGGCCATAC TTAGTAAAGA AACTGAGGTG CTGGACAGTC ATATTCATGC CTATGTTAAT 3 600 

65 GCACTCCTCA TTCCTGGACC AGCAGGCAAA ACAAAGCTAG AGAAACAATT CCAGCTCCTG 3 660 

AGCCAGTCAA ATATACAGCA GAGTGACTAT TCTGCAGCCC TAAAGCAATG CAACAGGGAA 372 0 

AAGAATCGAA CTTCTTCTAT CATCCCTGTG GAAAGATCAA GGGTTGGCAT TTCATCCCTG 37 80 

AGTGGAGAAG G CACAGACTA CATCAATGCC TCCTATATCA TGGGCTATTA CCAGAGCAAT 3 840 

GAATTCATCA TTACCCAGCA CCCTCTCCTT CATACCATCA AGGATTTCTG GAGGATGATA 3 90 0 

70 TGGGACCATA ATGCCCAACT GGTGGTTATG ATTCCTGATG GCCAAAACAT GGCAGAAGAT 3 960 

GAATTTGTTT ACTGGCCAAA TAAAGATGAG CCTATAAATT GTGAGAGCTT TAAGGTCACT 402 0 

CTTATGGCTG AAGAACACAA ATGTCTATCT AATGAGGAAA AACTTATAAT TCAGGACTTT 4080 

ATCTTAGAAG CTACACAGGA TGATTATGTA CTTGAAGTGA GGCACTTTCA GTGTCCTAAA 4140 

TGGCCAAATC CAGATAGCCC CATTAGTAAA ACTTTTGAAC TTATAAGTGT TATAAAAGAA 42 00 

75 GAAGCTGCCA ATAGGGATGG GCCTATGATT GTT CATGATG AGCATGGAGG AGTGACGGCA 4260 

GGAACTTTCT GTGCTCTGAC AACCCTTATG CACCAACTAG AAAAAGAAAA TTCCGTGGAT 4320 

GTTTACCAGG TAGCCAAGAT GATCAATCTG ATGAGGCCAG GAGTCTTTGC TGACATTGAG 43 80 

CAGTATCAGT TTCTCTACAA AGTGATCCTC AGCCTTGTGA GCACAAGGCA GGAAGAGAAT 4440 

CCATCCACCT CTCTGGACAG TAATGGTGCA GCATTGCCTG ATGGAAATAT AGCTGAGAGC 4500 

80 TTAGAGTCTT TAGTTTAACA CAGAAAGGGG TGGGGGGACT CACATCTGAG CATTGTTTTC 4560 

CTCTTCCTAA AATTAGGCAG GAAAATCAGT CTAGTTCTGT TATCTGTTGA TTTCCCATGA 4620 

CCTGACAGTA ACTTTCATGA CATAGGATTC TGCCGCCAAA TTTATATCAT TAACAATGTG 4680 

TGCCTTTTTG CAAGACTTGT AATTTACTTA TTATGTTTGA ACTAAAATGA TTGAATTTTA 4740 

CAGTATTTCT AAGAATGGAA TTGTGGTATT TTTTTCTGTA TTGATTTTAA CAGAAAATTT 4800 

85 CAATTTATAG AGGTTAGGAA TTCCAAACTA CAGAAAATGT TTGTTTTTAG TGTCAAATTT 4860 

TTAGCTGTAT TTGTAGCAAT TATCAGGTTT GCTAGAAATA TAACTTTTAA TACAGTAGCC 4920 

T GTAAAT AAA ACACTCTTCC ATATGATATT CAACATTTTA CAACTGCAGT ATTCACCTAA 4980 



258 



WO 02/086443 

AGTAGAAATA ATCTGTTACT 
AT AT T T AT AA TTGTAGATTT 
ATTGTTTAGT TTAATGACGT 
GTATTGTGTT ACCTAAGTCA 
ATAGAAATAC CTTCATTTTG 
TCAAATGGTT TTTATCCAAG 
AAAAAAAAAA AAAAAAAAAA 
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TATTGTAAAT 
TTATATTTTA 
AGTTCATTAG 
TTAACTTTGT 
AAAGAAGTTT 
GAATTGCAAA 
AAAAAAA 



ACTGCCCTAG 
CTACTGAGTC 
CTGGTCTTAC 
TTCAGCATGT 
TTATGAGAAT 
AATAAATATA 



TGTCTCCATG 
AAGTTTTCTA 
TCTACCAGTT 
AATTTTAACT 
AACACCTTAC 
AATATTGCCA 



GACCAAATTT 5040 

GTTCTGTGTA 510 0 

TTCTGACATT 5160 

TTTGTGGAAA 522 0 

CAAACATTGT 5280 

TTAAAAAAAA 5340 



10 



Seq ID NO: 182 Protein sequence: 
Protein Accession #: Eos sequence 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



I 



ii 



I 



MRILKRFLAC 
QSPINIDEDL 
FKASKITFHW 
ILFEVGTEEN 
TDTVDW I VFK 
TGKEEIHEAV 
HEFI/TDGYQD 
LIGTEEIIKE 
RSPTRGSEFS 
GSKTVLRSPH 
ENISQGYIFS 
TAQPDVGSGR 
TEVTPHAFTP 
PLVIVSALTF 
PIKHFPKHVA 
VAYDHSRVKLr 
VEVIVMITNL 
GSQKGRPSGR 
TGTYIVLDSM 
VLDSHIHAYV 
VERSRVGISS 
MIPDGQNMAE 
VLEVRHFQCP 
MHQLEKENSV 
AALPDGNIAE 



IQLLCVCRLD 
TQVNVN Li KKL 
GKCNMS SDGS 
LDFKAIIDGV 
DTVSISESQL 
CSSEPENVQA 
LGAILNNLLP 
EEEGKDIEEG 
GKGDVPNTSL 
MNLSGTAESL 
SENPETITYD 
ESFLQTNYTE 
SSRQQDLVST 
ICLWLVGIL 
DLHASSGFTE 
AQIiAEKDGKL 
VEKGRRKCDQ 
WTQYHYTQW 
LQQIQHEGTV 
NALL I PGP AG 
LSGEGTDYIN 
DEFVYWPNKD 
KWPNPDSPIS 
DVYQVAKMIN 
SLESLV 



21 
I 

WANGYYRQQR 
KFQGWDKTSL 
EHSLEGQKFP 
ESVSRFGKQA 
AVFCEVLTMQ 
DPENYTSLIiV 
NMSYVLQIVA 
AIVNPGRDSA 
NSTSQPVTKL 
NTVSITEYEE 
Vhl PESARNA 
IRVDESEKTT 
VNWYSQTTQ 
IYWRKCFQTA 
EFETLKEFYQ 
TDY INANYVD 
YWPADGSEEY 
PDMGVPEYSLp 
NIFGFLKHIR 
KTKLEKQFQIi 
ASYIMGYYQS 
EPINCESFKV 
KTFELISVIK 
LMRPGVFAD I 



31 



KLVEEIGWSY 
ENTFIHNTGK 
LEMQIYCFDA 
ALDPFILLNL 
Q SGYVMLMD Y 
TWERPRWYD 
ICTNGLYGKY 
TNQIRKKEPQ 
ATEKDISLTS 
ESLLTSFKLD 
SEDSTSSGSE 
KSFSAGPVMS 
PVYNAEASNS 
HFYLEDSTSP 
EVQSCTVDLG 
GYNRPKAYIA 
GNFLVTQKSV 
PVLTFVRKAA 
SQRNYLVQTE 
IiSQSNIQQSD 
NEFIITQHPL 
TLMAEEHKCL 
EEAANRDGPM 
EQYQFLYKVI 



41 
I 

TGALNQKNWG 
TVEINLTNDY 
DRFSSFEEAV 
LPNSTDKYYI 
LQNNFREQQY 
TMI EKFAVLY 
SDQLIVDMPT 
ISTTTHYNRI 
QTVTELPPHT 
TGAEDSSGSS 
ESLKDPSMEG 
QGPSVTDLEM 
SHESRIGLAE 
RVISTPPTPI 
ITADSSNHPD 
AQGPIiKSTAE 
QVLAYYTVRN 
YAKRHAVGPV 
EQYVFIHDTL 
YSAALKQCNR 
LHTIKDFWRM 
SNEEKLIIQD 
IVHDEHGGVT 
LSLVSTRQEE 



51 

! 

KKYPTCNSPK 
RVSGGVSEMV 
KGKGKLRALS 
YNGSLTSPPC 
KFSRQVFSSY 
QQLDGEDQTK 
DNPELDLFPE 
GTKYNEAKTN 
VEGTSASLND 
PATSAIPFIS 
NVWFPSSTDI 
PHYSTFAYFP 
GLESEKKAVI 
FPISDDVGAI 
NKHKNRYINI 
DFWRMIWEHN 
FTLRNTKIKK 
WHCSAGVGR 
VEAILSKETE 
EKNRTSSIIP 
I WDHNAQL W 
FILEATQDDY 
AGTFCALTTL 
NPSTSLDSNG 



Seq ID NO: 183 DNA sequence 

Nucleic Acid Accession #: EOS sequence 

Coding sequence: 148-4494 



11 



85 



CACACATACG 
CAAAAAAAAC 
CGGCGAGGGG 
CAGCTCCTCT 
CTTGTTGAAG 
AAATAT CCAA 
CAAGTAAATG 
AACACATTCA 
GTCAGCGGAG 
AAATG CAAT A 
GAG ATG C AAA 
GGAAAAGGGA 
GATTTCAAAG 
TTAGAT CCAT 
AATGGCTCAT 
ACAGT TAG CA 
TCTGGTTATG 
TTCTCTAGAC 
AGTT CAGAAC 
TGGGAAAGAC 
CAGTTGGATG 
GGTGCTATTC 
TGCACTAATG 
AATCCTGAAC 
GAAGAGGGAA 
AACCAAATCA 
ACGAAATACA 
AAGGGTGATG 
ACAGAAAAAG 
GAAGGTACTT 
AACTTGTCGG 
AGTTTATTGA 
GCAACTTCTG 
GAAAACCCAG 
GAAGATTCAA 
GTGTGGTTTC 
AGCTTTCTCC 
TCCTTTTCTG 
CATTATTCTA 
TCCAGACAAC 
GTATACAATG 



CACGCACGAT 
ATTTCCTTCG 
CCGCAGACCG 
GTGTTTGCCG 
AGATTGGCTG 
CATGTAATAG 
TGAATCTTAA 
TTCATAACAC 
GAGTTTCAGA 
TGTCATCTGA 
TCTACTGCTT 
AGTTAAGAGC 
CGATTAT TGA 
TCATACTGTT 
TGACATCTCC 
TCTCTGAAAG 
TCATGCTGAT 
AGGTGTTTTC 
CAGAAAATGT 
CTCGAGT CGT 
GAGAGGACCA 
TCAATAATTT 
GCTTATATGG 
TTGATCTTTT 
AAGACATTGA 
GGAAAAAGGA 
ATGAAGCCAA 
TTCCCAATAC 
ATATTTCCTT 
CAGCCTCTTT 
GGACTGCAGA 
CCAGTTTCAA 
CTATCCCATT 
AGACAATAAC 
CTTCATCAGG 
CTAGCTCTAC 
AGACTAATTA 
CAGGCCCAGT 
CCTTTGCCTA 
AGGATTTGGT 
AGGCCAGTAA 



21 
I 

CTCACTTCGA 
CTCCCCCTCC 
TCTGGAAATG 
CCTGGATTGG 
GTCCTATACA 
CCCAAAACAA 
GAAACTTAAA 
TGGGAAAACA 
AATGGTGTTT 
TGGATCAGAG 
TGATGCAGAC 
TTTATCCATT 
TGGAGTCGAA 
GAACCTTCTG 
TCCCTGCACA 
CCAGTTGGCT 
GGACTACTTA 
CTCATACACT 
TCAGGCTGAC 
TTATGATACC 
AACCAAGCAT 
GCTACCCAAT 
AAAATACAGC 
CCCTGAATTA 
AGAAGGCGCT 
ACCCCAGATT 
GACTAACCGA 
ATCTTTAAAT 
GACTTCTCAG 
AAATGATGGC 
AT CCTT AAAT 
GCTTGATACT 
CATCTCTGAG 
ATATGATGTC 
TTCAGAAGAA 
AGACATAACA 
CACTGAGATA 
GATGT CACAG 
CTTCCCAACT 
CTCCACGGTC 
TAGTAGCCAT 



31 
I 

TCTATACACT 
CTCTCCACTC 
CGAATCCTAA 
GCTAATGGAT 
GGAGCACTGA 
TCTCCTATCA 
TTTCAGGGTT 
GTGGAAATTA 
AAAGCAAGCA 
CATAGTTTAG 
CGATTTTCAA 
TTGTTTGAGG 
AGTGTTAGTC 
CCAAACTCAA 
GACACAGTTG 
GTTTTTTGTG 
CAAAACAATT 
GGAAAGGAAG 
CCAGAGAATT 
ATGATTGAGA 
GAATTTTTGA 
ATGAGTTATG 
GACCAACTGA 
ATTGGAACTG 
ATTGTGAATC 
TCTACCACAA 
TCCCCAACAA 
TCCACTTCCC 
ACTGTGACTG 
TCTAAAACTG 
ACAGTTTCTA 
GGAGCTGAAG 
AACATATCCC 
CTTATACCAG 
TCACTAAAGG 
GCACAGCCCG 
CGTGTTGATG 
GGTCCCTCAG 
GAGGTAACAC 
AACGTGGTAT 
GAGTCTCGTA 



41 



51 



GGAGGATTAA 
TGAGAAGCAG 
AGCGTTTCCT 
ACTACAGACA 
ATCAAAAAAA 
ATATTGATGA 
GGGATAAAAC 
ATCTCACTAA 
AGATAACTTT 
AAGGACAAAA 
GTTTTGAGGA 
TTGGGACAGA 
GTTTTGGGAA 
CTGACAAGTA 
ACTGGATTGT 
AAGTTCTTAC 
TTCGAGAGCA 
AGATTCATGA 
ATACCAGCCT 
AGTTTGCAGT 
CAGATGGCTA 
TTCTTCAGAT 
TTGTCGACAT 
AAGAAATAAT 
CTGGTAGAGA 
CACACTACAA 
GAGGAAGTGA 
AACCAGTCAC 
AACTGCCACC 
TTCTTAGATC 
TAACAGAATA 
ATTCTTCAGG 
AAGGGTATAT 
AATCTGCTAG 
ATCCTTCTAT 
ATGTTGGATC 
AATCTGAGAA 
TTACAGATCT 
CTCATGCTTT 
ACTCGCAGAC 
TTGGTCTAGC 



AACAAACAAA 
AGGAGCCGCA 
CGCTTGCATT 
ACAGAGAAAA 
TTGGGGAAAG 
AGATCTTACA 
ATCATTGGAA 
TGACTACCGT 
TCACTGGGGA 
ATTTCCACTT 
AGCAGT CAAA 
AGAAAAT TTG 
GCAGGCTGCT 
TTACATTTAC 
TTTTAAAGAT 
AATGCAACAA 
ACAGTACAAG 
AGCAGTTTGT 
TCTTGTTACA 
TTTGTACCAG 
TCAAGACTTG 
AGTAGCCATA 
GCCTACTGAT 
CAAGGAGGAG 
CAGTGCTACA 
TCGCATAGGG 
ATTCTCTGGA 
TAAATTAGCC 
TCACACTGTG 
TCCACATATG 
TGAGGAGGAG 
CTCCAGTCCC 
ATTTTCCTCC 
AAATGCTTCC 
GGAGGGAAAT 
AGGCAGAGAG 
GACAACCAAG 
GGAAATGCCA 
TACCCCATCC 
AACCCAACCG 
TGAGGGGTTG 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
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GAATCCGAGA AGAAGGCAGT 
CTAGTGGTTC TTGTGGGTAT 
TACTTAGAGG ACAGTACATC 
ATTTCAGATG ATGTCGGAGC 
CATG CAAGTA GTGGGTTTAC 
GGT AT T AC AG CAGACAGCTC 
ATCGTTGCCT ATGATCATAG 
CTGACTGATT ATATCAATGC 
GCTGCCCAAG GCCCACTGAA 
AATGTGGAAG TTATTGTCAT 
CAGTACTGGC CTGCCGATGG 
GTGCAAGTGC TTGCCTATTA 
AAGGGCTCCC AGAAAGGAAG 
TGGCCTGACA TGGGAGTACC 
GCCTATGCCA AGCGCCATGC 
AGAACAGGCA CATATATTGT 
GTCAACATAT TTGGCTTCTT 
GAGGAGCAAT ATGTCTTCAT 
GAGGTGCTGG ACAGTCATAT 
GGCAAAACAA AGCTAGAGAA 
GACTATTCTG CAGCCCTAAA 
CCTGTGGAAA GAT CAAGGGT 
AATGCCTCCT AT AT C ATGGG 
CTCCTTCATA CCAT CAAGGA 
GTTATGATTC CTGATGGCCA 
GATGAGCCTA TAAATTGTGA 
CTATCTAATG AGGAAAAACT 
TATGTACTTG AAGTGAGGCA 
AGTAAAACTT TTGAACTTAT 
ATGATTGTTC ATGATGAGCA 
CTTATGCACC AACTAGAAAA 
AAT CTGATGA GGCCAGGAGT 
ATCCTCAGCC TTGTGAGCAC 
GGTGCAGCAT TGCCTGATGG 
AAGGGGTGGG GGGACTCACA 
ATCAGT CT AG TTCTGTTATC 
GGATTCTGCC GCCAAATTTA 
TACTTATTAT GTTTGAACTA 
GGTATTTTTT TCTGTATTGA 
AAACTACAGA AAATGTTTGT 
AGGTTTGCTA GAAATATAAC 
GATATTCAAC ATTTTACAAC 
GTAAATACTG CCCTAGTGTC 
ATTTTACTAC TGAGTCAAGT 
CATTAGCTGG TCTTACTCTA 
CTTTGTTTCA GCATGTAATT 
AAGTTTTTAT GAGAATAACA 
TGCAAAAATA AATATAAATA 
AAA 
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TATACCCCTT 
TCTCATCTAC 
CCCTAGAGTT 
AATTCCAATA 
TGAAGAATTT 
CAACCACCCA 
CAGGGTTAAG 
CAATTATGTT 
ATCCACAGCT 
GATAACAAAC 
GAGTGAGGAG 
TACTGTGAGG 
ACCCAGTGGA 
AGAGTACTCC 
AGTGGGGCCT 
GCTAGACAGT 
AAAACACATC 
TCATGATACA 
TCATGCCTAT 
ACAATTCCAG 
GCAATGCAAC 
TGGCATTTCA 
CTATTACCAG 
TTTCTGGAGG 
AAACATGGCA 
GAGCTTTAAG 
TATAATTCAG 
CTTTCAGTGT 
AAGTGT T ATA 
TGGAGGAGTG 
AGAAAATTCC 
CTTTGCTGAC 
AAGGCAGGAA 
AAATATAGCT 
TCTGAGCATT 
TGTTGATTTC 
TATCATTAAC 
AAATGATTGA 
TTTTAACAGA 
TTTTAGTGTC 
TTTTAATACA 
TGCAGTATTC 
TCCATGGACC 
TTTCTAGTTC 
CCAGTTTTCT 
TTAACTTTTG 
CCTTACCAAA 
TTGCCATTAA 



GTGATCGTGT 
TGGAGGAAAT 
ATATCCACAC 
AAGCACTTTC 
GAGGAAGTGC 
GACAACAAGC 
CTAGCACAGC 
GATGGCTACA 
GAAGATTTCT 
CTCGTGGAGA 
TACGGGAACT 
AATTTTACTC 
CGTGTGGTCA 
CTGCCAGTGC 
GTTGTCGTCC 
ATGTTGCAGC 
CGTTCACAAA 
CTGGTTGAGG 
GTTAATGCAC 
CTCCTGAGCC 
AGGGAAAAGA 
TCCCTGAGTG 
AGCAATGAAT 
ATGATATGGG 
GAAGATGAAT 
GTCACTCTTA 
GACTTTATCT 
CCTAAATGGC 
AAAGAAGAAG 
ACGGCAGGAA 
GTGGATGTTT 
ATTGAGCAGT 
GAGAATCCAT 
GAGAGCTTAG 
GTTTTCCTCT 
CCATCACCTG 
AATGTGTGCC 
ATTTTACAGT 
AAATTTCAAT 
AAATTTTTAG 
GTAGCCTGTA 
ACCTAAAGTA 
AAATTTATAT 
TGTGTAATTG 
GACATTGTAT 
TGGAAAATAG 
CATTGTTCAA 
AAAAAAAAAA 



CAGCCCTGAC 
GCTTCCAGAC 
CTCCAACACC 
CAAAGCATGT 
AGAGCTGTAC 
ACAAGAATCG 
TTGCTGAAAA 
ACAGACCAAA 
GGAGAATGAT 
AAGGAAGGAG 
TTCTGGTCAC 
TAAGAAACAC 
CACAGTATCA 
TGACCTTTGT 
ACTGCAGTGC 
AGATTCAACA 
GAAATTATTT 
CCATACTTAG 
TCCTCATTCC 
AGTCAAATAT 
ATCGAACTTC 
GAGAAGGCAC 
TCATCATTAC 
ACCATAATGC 
TTGTTTACTG 
TGGCTGAAGA 
TAGAAGCTAC 
CAAATCCAGA 
CTGCCAATAG 
CTTTCTGTGC 
ACCAGGTAGC 
ATCAGTTTCT 
CCACCTCTCT 
AGTCTTTAGT 
TCCTAAAATT 
ACAGTAACTT 
TTTTTGCAAG 
ATTTCTAAGA 
TTATAGAGGT 
CTGTATTTGT 
AATAAAACAC 
GAAATAATCT 
TTATAATTGT 
TTTAGTTTAA 
TGTGTTACCT 
AAATACCTTC 
ATGGTTTTTA 
AAAAAAAAAA 



TTTTAT CTGT 
TGCACACTTT 
TATCTTTCCA 
TGCAGATTTA 
TGTTGACTTA 
ATACATAAAT 
GGATGGCAAA 
AGCTTATATT 
ATGGGAACAT 
AAAATGTGAT 
TCAGAAGAGT 
AAAAATAAAA 
CTACACGCAG 
GAGAAAGGCA 
TGGAGTTGGA 
CGAAGGAACT 
GGTACAAACT 
TAAAGAAACT 
TGGACCAGCA 
ACAGCAGAGT 
TTCTATCATC 
AGACTACATC 
CCAGCACCCT 
CCAACTGGTG 
GCCAAATAAA 
ACACAAATGT 
ACAGGATGAT 
TAGCCCCATT 
GGATGGGCCT 
TCTGACAACC 
CAAGATGATC 
CTACAAAGTG 
GGACAGTAAT 
TTAACACAGA 
AGGCAGGAAA 
TCATGACATA 
ACTTGTAATT 
ATGGAATTGT 
TAGGAATTCC 
AG C AAT T AT C 
TCTTCCATAT 
GTTACTTATT 
AGATTTTTAT 
TGACGTAGTT 
AAGTCATTAA 
ATTTTGAAAG 
TCCAAGGAAT 
AAAAAAAAAA 



Seq ID NO: 184 Protein sequence: 
Protein Accession #: EOS sequence 



80 



I 

MR I LKRFLAC 
QSPINIDEDL 
FKASKITFHW 
ILFEVGTEEN 
TDTVDWIVFK 
TGKEEIHEAV 
HEFLTDGYQD 
LIGTEEIIKE 
RSPTRGSEFS 
GSKTVLRSPH 
ENISQGYIFS 
TAQPDVGSGR 
TEVTPHAFTP 
LVIVSALTFI 
IKHFPKHVAD 
KLAQLAEKDG 
NLVEKGRRKC 
GRWTQYHYT 
SMLQQIQHEG 
YVNALLIPGP 
SSLSGEGTDY 
AEDEFVYWPN 
CPKWPNPDSP 
SVDVYQVAKM 
AESLESLV 



11 



IQLLCVCRLD 
TQVNVNLKKL 
GKCNMSSDGS 
LDFKAI IDGV 
DTVSISESQL 
CSSEPENVQA 
LGAILNNLLP 
EEEGKDIEEG 
GKGDVPNTSL 
MNLSGTAESL 
SENPETITYD 
ESFLQTNYTE 
SSRQQDDVST 
CLWLVGILI 
LHASSGFTEE 
KLTDYINANY 
DQYWPADGSE 
QWPDMGVPEY 
TVNIFGFLKH 
AGKTKLEKQF 
INASYIMGYY 
KDEPINCESF 
ISKTFELISV 
INLMRPGVFA 



21 
I 

WANGYYRQQR 
KFQGWDKTSL 
EHSLEGQKFP 
ESVSRFGKQA 
AVFCEVLTMQ 
DPENYTSLLV 
NMSYVLQIVA 
AIVNPGRDSA 
NSTSQPVTKL 
NTVSITEYEE 
VLIPESARNA 
IRVDESEKTT 
VNWYSQTTQ 
YWRKCFQTAH 
FEEVQSCTVD 
VDGYNRPKAY 
EYGNFLVTQK 
SLPVLTFVRK 
IRSQRNYLVQ 
QLLSQSNIQQ 
QSNEFIITQH 
KVTLMAEEHK 
I KEEAANRDG 
DIEQYQFLYK 



31 

I 

KLVEEIGWSY 
ENTFIHNTGK 
LEMQIYCFDA 
ALDPFILLNL 
QSGYVMLMDY 
TWERPRWYD 
ICTNGLYGKY 
TNQIRKKEPQ 
ATEKDISLTS 
ESLLTSFKLD 
SEDSTSSGSE 
KSFSAGPVMS 
PVYNEASNSS 
FYLEDSTSPR 
LGITADSSNH 
IAAQGPLKST 
SVQVLAYYTV 
AAYAKRHAVG 
TEEQYVFIHD 
SDYSAALKQC 
PLLHTIKDFW 
CLSNEEKLII 
PM I VHDEHGG 
VILSLVSTRQ 



41 

I 

TGALNQKNWG 
TVEINLTNDY 
DRFSSFEEAV 
LPNSTDKYYI 
LQNNFREQQY 
TMIEKFAVLY 
SDQLIVDMPT 
ISTTTHYNRI 
QTVTELPPHT 
TGAEDSSGSS 
ESLKDPSMEG 
QGPSVTDLEM 
HESRIGLAEG 
VISTPPTPIF 
PDNKHKNRYI 
AEDFWRMIWE 
RNFTLRNTKI 
PVWHCSAGV 
TLVEAILSKE 
NREKNRTS S I 
RMIWDHNAQL 
QDFILEATQD 
VTAGTFCALT 
EENPSTSLDS 



51 

i 

KKYPTCNSPK 
RVSGGVSEMV 
KGKGKLRALS 
YNGSLTSPPC 
KFSRQVFSSY 
QQLDGEDQTK 
DNPELDLFPE 
GTKYNEAKTN 
VEGTSASLND 
PATSAIPFIS 
NVWFPSSTDI 
PHYSTFAYFP 
LESEKKAVIP 
PISDDVGAIP 
NIVAYDHSRV 
HNVEVIVMIT 
KKGSQKGRPS 
GRTGTYIVLD 
TEVLDSH I HA 
IPVERSRVGI 
WMIPDGQNM 
DYVLEVRHFQ 
TLMHQLEKEN 
NGAALPDGNI 



2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4680 
4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 
5280 
5340 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
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CACACATACG CACGCACGAT CTCACTTCGA TCTATACACT GGAGGATTAA AACAAACAAA 60 

CAAAAAAAAC ATTTCCTTCG CTCCCCCTCC CTCTCCACTC TGAGAAGCAG AGGAGCCGCA 12 0 

CGGCGAGGGG CCGCAGACCG TCTGGAAATG CGAATCCTAA AGCGTTTCCT CGCTTGCATT 180 

CAGCTCCTCT GTGTTTGCCG CCTGGATTGG GCTAATGGAT ACTACAGACA ACAGAGAAAA 240 

CTTGTTGAAG AGATTGGCTG GTCCTATACA GGAGCACTGA ATCAAAAAAT TGGGGAAAGA 3 00 

AATATCCAAC ATGTAATAGC CCAAAACAAT CTCCTATCAA TATTGATGAA GATCTTACAC 360 

AAGTAAATGT GAATCTTAAG AAACTTAAAT TTCAGGGTTG GGATAAAACA TCATTGGAAA 420 

ACACATTCAT TCATAACACT GGGAAAACAG TGGAAATTAA TCTCACTAAT GACTACCGTG 480 

TCAGCGGAGG AGTTTCAGAA ATGGTGTTTA AAGCAAGCAA GATAACTTTT CACTGGGGAA 540 

AATGCAATAT GTCATCTGAT GGATCAGAGC ATAGTTTAGA AGGACAAAAA TTTCCACTTG 600 
AGATGCAAAT CTACTGCTTT GATGCGGACC GATTTTCAAG TTTTGAGGAA GCAGT CAAAG 660 
GAAAAGGGAA GTTAAGAGCT TTATCCATTT TGTTTGAGGT TG GG AC AG AA GAAAATT TGG 720 
ATTTCAAAGC GATTATTGAT GGAGT CGAAA GTGTTAGTCG TTTTGGGAAG CAGGCTGCTT 780 
TAGATCCATT CATACTGTTG AACCTTCTGC CAAACTCAAC TGACAAGTAT TACATTTACA 840 
ATGGCTCATT GACATCTCCT CCCTGCACAG ACACAG T TG A CTGGATTGTT TTTAAAGATA 900 
CAGTTAGCAT CTCTGAAAGC CAGTTGGCTG TTTTTTGTGA AGTTCTTACA AT G C AACAAT 960 

CTGGTTATGT CATGCTGATG GACTACTTAC AAAACAATTT TCGAGAGCAA CAGTACAAGT 102 0 

TCTCTAGACA GGTGTTTTCC TCATACACTG GAAAGGAAGA GATTCATGAA GCAGTTTGTA 10 80 

GTTCAGAACC AGAAAATGTT CAGGCTGACC CAGAGAATTA TACCAGCCTT CTTGTTACAT 1140 

GGGAAAGACC TCGAGTCGTT TATGATACCA TGATTGAGAA GTTTGCAGTT TTGTACCAGC 1200 

AGTTGGATGG AGAGGACCAA ACCAAGCATG AATTTTTGAC AGATGGCTAT CAAGACTTGG 1260 

GTGCTATTCT CAATAATTTG CTACCCAATA TGAGTTATGT TCTTCAGATA GTAGCCATAT 1320 

GCACTAATGG CTTATATGGA AAATACAGCG ACCAACTGAT TGTCGACATG CCTACTGATA 13 80 

AT CCTGAACT TGATCTTTTC CCTGAATTAA TTGGAACTGA AGAAATAATC AAGGAGGAGG 1440 

AAGAGGGAAA AGACATTGAA GAAGGCGCTA TTGTGAATCC TGGTAGAGAC AGTGCTACAA 1500 

ACCAAAT CAG GAAAAAGGAA CCCCAGATTT CTACCACAAC ACACTACAAT CGCATAGGGA 1560 

CGAAATACAA TGAAGCCAAG ACTAACCGAT CCCCAACAAG AGGAAGTGAA TTCTCTGGAA 1620 

AGGGTGATGT TCCCAATACA TCTTTAAATT CCACTTCCCA ACCAGTCACT AAATTAGCCA 1680 

CAGAAAAAGA TATTTGCTTG ACTTCTCAGA CTGTGACTGA ACTGCCACCT CACACTGTGG 1740 

AAGGTACTTC AGCCTCTTTA AATGATGGCT CTAAAACTGT TCTTAGATCT CCACATATGA 180 0 

ACTTGT CGGG GACTGCAGAA TCCTTAAATA CAGTTTCTAT AACAGAATAT GAGGAGGAGA 1860 

GTTTATTGAC CAGTTTCAAG CTTGATACTG GAGCTGAAGA TTCTTCAGGC TCCAGTCCCG 1920 

CAACTTCTGC TATCCCATTC ATCTCTGAGA ACATATCCCA AGGGTATATA TTTTCCTCCG 1980 

AAAACCCAGA GACAATAACA TATGATGTCC TTATACCAGA ATCTGCTAGA AATGCTTCCG 2 040 

AAGATTCAAC TTCATCAGGT TCAGAAGAAT CACTAAAGGA TCCTTCTATG GAGGGAAATG 2100 

TGTGGTTTCC TAGCTCTACA GACATAACAG CACAGCCCGA TGTTGGATCA GGCAGAGAGA 2160 

GCTTTCTCCA GACTAATTAC ACTGAGATAC GTGTTGATGA ATCTGAGAAG ACAACCAAGT 222 0 

CCTTTTCTGC AGGCCCAGTG ATGTCACAGG GTCCCTCAGT TACAGATCTG GAAATGCCAC 2280 

ATTATTCTAC CTTTGCCTAC TTCCCAACTG AGGTAACACC TCATGCTTTT ACCCCATCCT 23 40 

CCAGACAACA GGATTTGGTC TCCACGGTCA ACGTGGTATA CTCGCAGACA ACCCAACCGG 2400 

TATACAATGA GGCCAGTAAT AGTAGCCATG AGTCTCGTAT TGGTCTAGCT GAGGGGTTGG 2460 

AATCCGAGAA GAAGGCAGTT ATACCCCTTG TGAT CGTGTC AGCCCTGACT TTTATCTGTC 2520 

TAGTGGTTCT TGTGGGTATT CTCATCTACT GGAGGAAATG CTTCCAGACT GCACACTTTT 2580 

ACTTAGAGGA CAGTACATCC CCTAGAGTTA TATCCACACC TCCAACACCT ATCTTTCCAA 2 640 

TTTCAGATGA TGTCGGAG CA ATTCCAATAA AGCACTTTCC AAAGCATGTT GCAGATTTAC 2 700 

ATGCAAGTAG TGGGTTTACT GAAGAATTTG AGACACTGAA AGAGTTTTAC CAGGAAGTGC 2 760 

AGAGCTGTAC TGTTGACTTA GGTATTACAG CAGACAGCTC CAACCACCCA GACAACAAGC 2820 

ACAAGAATCG ATACATAAAT ATCGTTGCCT ATGATCATAG CAGGGTTAAG CTAGCACAGC 2 880 

TTGCTGAAAA GGATGGCAAA CTGACTGATT ATATCAATGC CAATTATGTT GATGGCTACA 2 940 

ACAGACCAAA AGCTTATATT GCTGCCCAAG GCCCACTGAA ATCCACAGCT GAAGATTTCT 3 000 

GGAGAATGAT ATGGGAACAT AATGTGGAAG TTATTGTCAT GATAACAAAC CTCGTGGAGA 3 060 

AAGGAAGGAG AAAATGTGAT CAGTACTGGC CTGCCGATGG GAGTGAGGAG TACGGGAACT 3120 

TTCTGGTCAC TCAGAAGAGT GTGCAAGTGC TTGCCTATTA TACTGTGAGG AATTTTACTC 3180 

TAAGAAACAC AAAAATAAAA AAGGGCTCCC AGAAAGGAAG ACCCAGTGGA CGTGTGGTCA 3240 

CACAGTATCA CTACACGCAG TGGCCTGACA TGGGAGTACC AGAGTACTCC CTGCCAGTGC 33 00 

TGACCTTTGT GAGAAAGGCA GCCTATGCCA AGCGCCATGC AGTGGGGCCT GTTGTCGTCC 3 3 60 

ACTGCAGTGC TGGAGTTGGA AGAACAGGCA CATATATTGT G CT AG ACAGT ATGTTGCAGC 3420 

AGATTCAACA CGAAGGAACT GTCAACATAT TTGGCTTCTT AAAACACAT C CGTTCACAAA 3480 

GAAATTATTT GGTACAAACT GAGGAGCAAT ATGTCTTCAT TCATGATACA CTGGTTGAGG 3540 

CCATACTTAG TAAAGAAACT GAGGTGCTGG ACAGTCATAT TCATGCCTAT GTTAATGCAC 3600 

TCCTCATTCC TGGACCAGCA GGCAAAACAA AGCTAGAGAA ACAATT CCAG CTCCTGAGCC 3660 

AGTCAAATAT ACAGCAGAGT GACTATTCTG CAGCCCTAAA GCAATGCAAC AGGGAAAAGA 3720 

ATCGAACTTC TTCTAT CAT C CCTGTGGAAA GAT CAAGGGT TGGCATTTCA TCCCTGAGTG 3780 
GAGAAGGCAC AG ACT ACAT C AATGCCTCCT ATATCATGGG CTATTACCAG AGCAATGAAT 3840 
T CAT CATTAC CCAGCACCCT CTCCTTCATA CCATCAAGGA TTTCTGGAGG ATGATATGGG 3900 
ACCATAATGC CCAACTGGTG GTTATGATT C CTGATGGCCA AAACATGGCA GAAGATGAAT 3960 
TTGTTTACTG GCCAAATAAA GATGAGCCTA TAAATTGTGA GAGCTTTAAG GTCACTCTTA 4020 
TGGCTGAAGA ACACAAATGT CTAT CTAATG AGGAAAAACT TATAATTCAG GACTTTATCT 4080 
TAGAAGCTAC ACAGGATGAT TATGTACTTG AAGTGAGGCA CTTTCAGTGT CCTAAATGGC 4140 
CAAATCCAGA TAGCCCCATT AGTAAAACTT TTGAACTTAT AAGTGTTATA AAAGAAGAAG 4200 
CTGCCAATAG GGATGGGCCT ATGATTGTTC ATGATGAGCA TGGAGGAGTG ACGGCAGGAA 4260 
CTTTCTGTGC TCTGACAACC CTTATGCACC AACTAGAAAA AGAAAATTCC GTGGATGTTT 4320 
ACCAGGTAGC CAAGATGATC AATCTGATGA GGCCAGGAGT CTTTGCTGAC ATTGAGCAGT 4380 
ATCAGTTTCT CTACAAAGTG ATCCTCAGCC TTGTGAGCAC AAGGCAGGAA GAGAATCCAT 4440 
CCACCTCTCT GGACAGTAAT GGTGCAGCAT TGCCTGATGG AAATATAGCT GAGAGCTTAG 4500 
AGTCTTTAGT TTAACACAGA AAGGGGTGGG GGG ACT CACA TCTGAGCATT GTTTTCCTCT 4560 
TCCTAAAATT AGG C AGG AAA ATCAGT CTAG TTCTGTTATC TGTTGATTTC CCATCACCTG 4620 
ACAGTAACTT TCATGACATA GGATTCTGCC GCCAAATTTA TATCATTAAC AATGTGTGCC 4680 
TTTTTGCAAG ACTTGTAATT TACTTATTAT GTTTGAACTA AAATGATTGA ATTTTACAGT 4740 
ATTTCTAAGA ATGGAATTGT GGTATTTTTT TCTGTATTGA TTTTAACAGA AAATTTCAAT 480 0 
T T AT AGAGGT TAGGAATTCC AAACTACAGA AAATGTTTGT TTTTAGTGTC AAATTTTTAG 4860 
CTGTATTTGT AGCAATTATC AGGTTTGCTA GAAATATAAC TTTTAATACA GTAGCCTGTA 4920 
AATAAAACAC TCTTCCATAT GATATTCAAC ATTTTACAAC TGCAGTATTC ACCTAAAGTA 4980 
GAAATAATCT GTTACTTATT GTAAATACTG CCCTAGTGTC TCCATGGACC AAATTTATAT 5040 
TTATAATTGT AGATTTTTAT ATTTTACTAC TGAGTCAAGT TTTCTAGTTC TGTGTAATTG 5100 
TTTAGTTTAA TGACGTAGTT CATTAGCTGG TCTTACTCTA CCAGTTTTCT GACATTGTAT 5160 
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TGTGTTACCT AAGTCATTAA CTTTGTTTCA GCATGTAATT TTAACTTTTG TGGAAAATAG 
AAATACCTTC ATTTTGAAAG AAGTTTTTAT GAGAATAACA CCTTACCAAA CATTGTTCAA 
ATGGTTTTTA TCCAAGGAAT TGCAAAAATA AATATAAATA TTGCCATTAA AAAAAAAAAA 
AAAAAAAAAA AAAAAAAAAA AAA 

Seq ID NO: 186 Protein sequence: 
Protein Accession #: EOS sequence 
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1 

1 

MVFKASKITF 
LSILFEVGTE 
PCTDTVDWIV 
SYTGKEEIHE 
TKHEFLTDGY 
PELIGTEEII 
TNRSPTRGSE 
NDGSKTVLRS 
ISENISQGYI 
DITAQPDVGS 
FPTEVTPHAF 
IPLVIVSALT 
IPIKHFPKHV 
IVAYDHSRVK 
NVEVIVMITN 
KGSQKGRPSG 
RTGTYIVLDS 
E VLDSH I HAY 
PVERSRVGIS 
VM I PDGQNMA 
YVLEVRHFQC 
LMHQLEKENS 
GAALPDGN I A 



11 
i 

HWGKCNMSSD 
ENLDFKAI ID 
FKDTVSISES 
AVCSSEPENV 
QDLGAILNNL 
KEEEEGKDIE 
FSGKGDVPNT 
PHMNLSGTAE 
FSSENPETIT 
GRESFLQTNY 
TPSSRQQDLV 
FICLVVLVGI 
ADLHASSGFT 
LAQLAEKDGK 
LVEKGRRKCD 
RWTQYHYTQ 
MLQQIQHEGT 
VNALLIPGPA 
SLSGEGTDY I 
EDEFVYWPNK 
PKWPNPDSPI 
VDVYQVAKMI 
ESLESLV 



21 
i 

GSEHSLEGQK 
GVESVSRFGK 
QLAVFCEVLT 
QADPENYTSL 
LPNMSYVLQI 
EGAIVNPGRD 
SLNSTSQPVT 
SLNTVSITEY 
YDVLI PESAR 
TEIRVDESEK 
STVNWYSQT 
LIYWRKCFQT 
EEFETLKEFY 
LTDYINANYV 
QYWPADGSEE 
WPDMGVPEYS 
VNIFGFLKHI 
GKTKLEKQFQ 
NASYIMGYYQ 
DEPINCESFK 
SKTFELISVI 
NLMRPGVFAD 



31 

1 

FPLEMQIYCF 
QAALDPFILL 
MQQSGYVMLM 
LVTWERPRW 
VAICTNGLYG 
SATNQIRKKE 
KLATEKDISL 
EEESLLTSFK 
NASEDSTSSG 
TTKSFSAGPV 
TQPVYNEASN 
AHFYLEDSTS 
QEVQSCTVDL 
DGYNRPKAYI 
YGNFLVTQKS 
LPVLTFVRKA 
RSQRNYLVQT 
LLSQSNIQQS 
SNEFIITQHP 
VTLMAEEHKC 
KEEAANRDGP 
IEQYQFLYKV 



41 

I 

DADRFSSFEE 
NLLPNSTDKY 
DYLQNNFREQ 
YDTMIEKFAV 
KYSDQLIVDM 
PQISTTTHYN 
TSQTVTELPP 
LDTGAEDSSG 
SEESLKDPSM 
MSQGPSVTDL 
S SHE SR I GL A 
PRVISTPPTP 
GITADSSNHP 
AAQGPLKSTA 
VQVLAYYTVR 
AYAKRHAVGP 
EEQYVFIHDT 
DYSAALKQCN 
LLHTIKDFWR 
LSNEEKLIIQ 
MIVHDEHGGV 
ILSLVSTRQE 



51 
I 

AVKGKGKLRA 
YIYNGSLTSP 
QYKFSRQVFS 
LYQQLDGEDQ 
PTDNPELDLF 
RIGTKYNEAK 
HTVEGTSASL 
SSPATSAIPF 
EGNVWFPSST 
EMPHYSTFAY 
EGLESEKKAV 
IFPISDDVGA 
DNKHKNRY IN 
EDFWRMIWEH 
NFTLRNTKIK 
VWHCSAGVG 
LVEAILSKET 
REKNRTSSII 
MIWDHNAQLV 
DFILEATQDD 
TAGTFCALTT 
ENPSTSLDSN 



Seq ID NO: 187 DNA sequence 

Nucleic Acid Accession #: EOS sequence 

Coding sequence: 148-4632 



85 



CACACATACG 
CAAAAAAAAC 
CGGCGAGGGG 
CAGCTCCTCT 
CTTGTTGAAG 
AAATATCCAA 
CAAGTAAATG 
AACACATTCA 
GTCAGCGGAG 
AAATGCAATA 
GAGATGCAAA 
GGAAAAGGGA 
GATTT CAAAG 
TTAGAT CCAT 
AATGGCT CAT 
ACAGTTAGCA 
TCTGGTTATG 
TTCTCTAGAC 
AGT TCAGAAC 
TGGGAAAGAC 
CAGTTGGATG 
GGTGCTATTC 
TGCACTAATG 
AATCCTGAAC 
GAAGAGGGAA 
AACCAAATCA 
ACGAAATACA 
AAGGGTGATG 
ACAGAAAAAG 
GAAGGTACTT 
AACTTGTCGG 
AGTTTATTGA 
GCAACTTCTG 
GAAAACCCAG 
GAAGATTCAA 
GTGTGGTTTC 
AGCTTTCTCC 
TCCTTTTCTG 
CATTATTCTA 
TCCAGACAAC 
GTATACAATG 
GAATCCGAGA 
CTAGTGGTTC 
TACTTAGAGG 
ATTT CAGATG 
CATGCAAGTA 
CAGAGCTGTA 



11 
I 

CACGCACGAT 
ATTTCCTTCG 
CCGCAGACCG 
GTGTTTGCCG 
AGATTGGCTG 
CATGTAATAG 
TGAATCTTAA 
TTCATAACAC 
GAGTTTCAGA 
TGTCAT CTGA 
TCTACTGCTT 
AGTTAAGAGC 
CGATTATTGA 
TCATACTGTT 
TGACATCTCC 
TCTCTGAAAG 
TCATGCTGAT 
AGGTGTTTTC 
CAGAAAATGT 
CTCGAGTCGT 
GAGAGGACCA 
TCAATAATTT 
GCTTATATGG 
TTGATCTTTT 
AAGACATTGA 
GGAAAAAGGA 
ATGAAGCCAA 
TTCCCAATAC 
ATATTTCCTT 
CAGCCTCTTT 
GGACTGCAGA 
CCAGTTTCAA 
CTATCCCATT 
AGACAATAAC 
CTTCATCAGG 
CTAGCTCTAC 
AGACTAATTA 
CAGGCCCAGT 
CCTTTGCCTA 
AGGATTTGGT 
AGGCCAGTAA 
AGAAGGCAGT 
TTGTGGGTAT 
ACAGTACATC 
ATGT CGGAGC 
GTGGGTTTAC 
CTGTTGACTT 



21 

! 

CTCACTTCGA 
CTCCCCCTCC 
TCTGGAAATG 
CCTGGATTGG 
GTCCTATACA 
CCCAAAACAA 
GAAACTTAAA 
TGGGAAAACA 
AATGGTGTTT 
TGGAT CAGAG 
TGATGCGGAC 
TTTATCCATT 
TGGAGTCGAA 
GAACCTTCTG 
TCCCTGCACA 
CCAGTTGGCT 
GGACTACTTA 
CTCATACACT 
TCAGGCTGAC 
TTATGATACC 
AACCAAGCAT 
GCTACCCAAT 
AAAATACAGC 
CCCTGAATTA 
AGAAGGCGCT 
ACCCCAGATT 
GACTAACCGA 
ATCTTTAAAT 
GACTTCTCAG 
AAATGATGGC 
ATCCTTAAAT 
GCTTGATACT 
CATCTCTGAG 
ATATGATGTC 
TTCAGAAGAA 
AGACATAACA 
CACTGAGATA 
GATGT CACAG 
CTTCCCAACT 
CTCCACGGTC 
TAGTAGCCAT 
TATACCCCTT 
TCTCATCTAC 
CCCTAGAGTT 
AATTCCAATA 
TGAAGAATTT 
AGGTATTACA 



31 
I 

TCTATACACT 
CTCTCCACTC 
CGAATCCTAA 
GCTAATGGAT 
GGAGCACTGA 
TCTCCTATCA 
TTTCAGGGTT 
GTGGAAATTA 
AAAGCAAGCA 
CATAGTTTAG 
CGATTTTCAA 
TTGTTTGAGG 
AGTGTTAGTC 
CCAAACTCAA 
GACACAGTTG 
GTTTTTTGTG 
CAAAACAATT 
GGAAAGGAAG 
CCAGAGAATT 
ATGATTGAGA 
GAATTTTTGA 
ATGAGTTATG 
GACCAACTGA 
ATTGGAACTG 
ATTGTGAATC 
TCTACCACAA 
TCCCCAACAA 
TCCACTTCCC 
ACTGTGACTG 
TCTAAAACTG 
ACAGTTTCTA 
GGAGCTGAAG 
AACATATCCC 
CTTATACCAG 
TCACTAAAGG 
GCACAGCCCG 
CGTGTTGATG 
GGTCCCTCAG 
GAGGTAACAC 
AACGTGGTAT 
GAGT CTCGTA 
GTGATCGTGT 
TGGAGGAAAT 
ATATCCACAC 
AAGCACTTTC 
GAGACACTGA 
GCAGACAGCT 



41 

1 

GGAGGATTAA 
TGAGAAGCAG 
AACGTTTCCT 
ACTACAGACA 
ATCAAAAAAA 
ATATTGATGA 
GGGATAAAAC 
AT CTCACT AA 
AGATAACTTT 
AAGGACAAAA 
GTTTTGAGGA 
TTGGGACAGA 
GTTTTGGGAA 
CTGACAAGTA 
ACTGGATTGT 
AAGTT CTTAC 
TTCGAGAGCA 
AGATTCATGA 
ATACCAGCCT 
AGTTTGCAGT 
CAGATGGCTA 
TTCTTCAGAT 
TTGTCGACAT 
AAGAAATAAT 
CTGGTAGAGA 
CACACTACAA 
GAGGAAGTGA 
AACCAGTCAC 
AACTGCCACC 
TTCTTAGATC 
TAACAGAATA 
ATTCTTCAGG 
AAGGGTATAT 
AATCTGCTAG 
AT CCTTCT AT 
ATGTTGGATC 
AATCTGAGAA 
TTACAGATCT 
CTCATGCTTT 
ACTCGCAGAC 
TTGGTCTAGC 
CAGCCCTGAC 
GCTTCCAGAC 
CTCCAACACC 
CAAAG CAT GT 
AAGAGTTTTA 
CCAACCACCC 



51 



AACAAACAAA 
AGGAGCCGCA 
CGCTTGCATT 
ACAGAGAAAA 
TTGGGGAAAG 
AGATCTTACA 
ATCATTGGAA 
TGACTACCGT 
TCACTGGGGA 
ATTTCCACTT 
AGCAGTCAAA 
AGAAAATTTG 
GCAGGCTGCT 
TTACAT TTAC 
TTTTAAAGAT 
AATGCAACAA 
ACAGTACAAG 
AGCAGTTTGT 
TCTTGTTACA 
TTTGTACCAG 
TCAAGACTTG 
AGTAGCCATA 
GCCTACTGAT 
CAAGGAGGAG 
CAGTGCTACA 
TCGCATAGGG 
ATTCTCTGGA 
TAAATTAGCC 
TCACACTGTG 
TCCACATATG 
TGAGGAGGAG 
CTCCAGTCCC 
ATTTTCCTCC 
AAATGCTTCC 
GGAGGGAAAT 
AGGCAGAGAG 
GACAACCAAG 
GGAAATG CC A 
TACCCCATCC 
AACCCAACCG 
TGAGGGGTTG 
TTTTATCTGT 
TGCACACTTT 
TATCTTTCCA 
TGCAGATTTA 
CCAGGAAGTG 
AGACAACAAG 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 



262 



WO 02/086443 

CACAAGAATC GATACATAAA TATCGTTGCC TATGATCATA GCAGGGTTAA GCTAGCACAG 2 880 

CTTGCTGAAA AGGATGGCAA ACTGACTGAT TATATCAATG CCAATTATGT TGATGGCTAC 2 940 

AACAGACCAA AAGCTTATAT TGCTGCCCAA GGCCCACTGA AATCCACAGC TGAAGATTTC 3000 

TGGAGAATGA TATGGGAACA TAATGTGGAA GTTATTGTCA TGATAACAAA CCTCGTGGAG 3060 

AAAGGAAGGA GAAAATGTGA TCAGTACTGG CCTGCCGATG GGAGTGAGGA GTACGGGAAC 3120 

TTTCTGGTCA CTCAGAAGAG TGTGCAAGTG CTTGCCTATT ATACTGTGAG GAATTTTACT 3180 

CTAAGAAACA CAAAAATAAA AAAGGGCTCC CAGAAAGGAA GACCCAGTGG ACGTGTGGTC 3240 

ACACAGTATC ACTACACGCA GTGGCCTGAC ATGGGAGTAC CAGAGTACTC CCTGCCAGTG 33 00 

CTGACCTTTG TGAGAAAGGC AGCCTATGCC AAGCGCCATG CAGTGGGGCC TGTTGTCGTC 33 60 

CACTGCAGTG CTGGAGTTGG AAGAACAGGC ACATATATTG TGCTAGACAG TATGTTGCAG 3420 

CAGATTCAAC ACGAAGGAAC TGTCAACATA TTTGGCTTCT TAAAACACAT CCGTTCACAA 3480 

AGAAATTATT TGGTACAAAC TGAGGAGCAA TATGTCTTCA TTCATGATAC ACTGGTTGAG 3540 

GCCATACTTA GTAAAGAAAC TGAGGTGCTG GACAGT CAT A TTCATGCCTA TGTTAATGCA 3 600 

CTCCTCATTC CTGGACCAGC AGGCAAAACA AAGCTAGAGA AACAATTCCA GGGTCTCACT 3 660 

CTGTCACCCA GGCTGGAGTG CAGAGGCACA ATCTCGGCTC ACTGCAACCT TCCTCTCCCT 372 0 

GGCTTAACTG ATCCTCCTAC CTCAGCCTCC CGAGTGGCTG GGACTATACT CCTGAGCCAG 3780 

TCAAATATAC AGCAGAGTGA CTATTCTGCA GCCCTAAAGC AATGCAACAG GGAAAAGAAT 3840 

CGAACTTCTT CTATCATCCC TGTGGAAAGA TCAAGGGTTG GCATTTCATC CCTGAGTGGA 3 900 

GAAGGCACAG ACTACATCAA TGCCTCCTAT ATCATGGGCT ATTACCAGAG CAATGAATTC 3 960 

ATCATTACCC AGCACCCTCT CCTTCATACC ATCAAGGATT TCTGGAGGAT GATATGGGAC 4020 

CATAATGCCC AACTGGTGGT TATGATTCCT GATGG CCAAA ACATGGCAGA AGATGAATTT 40 80 

GTTTACTGGC CAAATAAAGA TGAGCCTATA AAT TGTGAGA GCTTTAAGGT CACTCTTATG 4140 

GCTGAAGAAC AC AAATGT CT ATCTAATGAG GAAAAACTTA TAATT CAGG A CTTTATCTTA 42 00 

GAAGCTACAC AGGATGATTA TGTACTTGAA GTGAGGCACT TTCAGTGTCC TAAATGGCCA 42 60 

AATCCAGATA GCCCCATTAG TAAAACTTTT GAACTTATAA GTGTTATAAA AGAAGAAGCT 432 0 

GCCAATAGGG ATGGGCCTAT GATTGTTCAT GATGAGCATG GAGGAGTGAC GGCAGGAACT 4380 

TTCTGTGCTC TGACAACCCT TATGCACCAA C T AG AAAAAG AAAATTCCGT GGATGTTTAC 4440 

CAGGTAGCCA AGATGAT CAA TCTGATGAGG CCAGGAGTCT TTGCTGACAT TGAGCAGTAT 4500 

CAGTTTCTCT ACAAAGTGAT CCTCAGCCTT GTGGGCACAA GGCAGGAAGA GAATCCATCC 4560 

ACCTCTCTGG ACAGTAATGG TG C AG CAT T G CCTGATGGAA ATATAGCTGA GAGCTTAGAG 462 0 

TCTTTAGTTT AACACAGAAA GGGGTGGGGG GACT CACATC TGAGCATTGT TTTCCTCTTC 4680 

CTAAAATTAG GCAGGAAAAT CAGTCTAGTT CTGTTATCTG TTGATTTCCC ATCACCTGAC 4740 

AGTAACTTTC ATGACATAGG ATTCTGCCGC CAAATTTATA TCATTAACAA TGTGTGCCTT 480 0 

TTTGCAAGAC TTGTAATTTA CTTATTATGT TTGAACTAAA ATGATTGAAT TTTACAGTAT 4860 

TTCTAAGAAT GGAATTGTGG TATTTTTTTC TGTATTGATT TTAACAGAAA ATTTCAATTT 4920 

ATAGAGGTTA GGAATTCCAA ACTACAGAAA ATGTTTGTTT TTAGTGTCAA ATTTTTAGCT 4980 

GTATTTGTAG CAATT AT CAG GTTTGCTAGA AATATAACTT TTAATACAGT AGCCTGTAAA 5040 

TAAAACACTC TTCCATATGA TATTCAACAT TTTACAACTG CAGTATTCAC CTAAAGTAGA 5100 

AATAATCTGT TACTTATTGT AAATACTGCC CTAGTGTCTC CATGGACCAA ATTTATATTT 5160 

ATAATTGTAG ATTTTTATAT TTTACTACTG AGTCAAGTTT TCTAGTTCTG TGTAATTGTT 5220 

TAGTTTAATG ACGTAGTTCA TTAGCTGGTC TTACTCTACC AGTTTTCTGA CATTGTATTG 5280 

TGTTACCTAA GTCATTAACT TTGTTTCAGC ATGTAATTTT AACTTTTGTG GAAAATAGAA 5340 

ATACCTTCAT TTTGAAAGAA GTTTTTATGA GAATAACACC TTACCAAACA TTGTT CAAAT 5400 

GGTTTTTATC CAAGGAATTG CAAAAATAAA TATAAATATT GCCATTAAAA AAAAAAAAAA 5460 
AAAAAAAAAA AAAAAAAAAA A 

Seq ID NO: 188 Protein sequence: 
Protein Accession #: EOS sequence 

1 11 21 31 41 51 

1 I I I I I 

MRILKRFLAC IQLLCVCRLD WANGYYRQQR KLVEEIGWSY TGALNQKNWG KKYPTCNSPK 60 

QSPINIDEDL TQVNVNLKKL KFQGWDKTSL ENTFIHNTGK TVEINLTNDY RVSGGVSEMV 120 

FKASKITFHW GKCNMSSDGS EHSLEGQKFP LEMQIYCFDA DRFSSFEEAV KGKGKLRALS 180 

ILFEVGTEEN LDFKAIIDGV ESVSRFGKQA ALDPFILLNL LPNSTDKYYI YNGSLTSPPC 240 

TDTVDWIVFK DTVSISESQL AVFCEVLTMQ QSGYVMLMDY LQNNFREQQY KFSRQVFSSY 300 

TGKEEIHEAV CSSEPENVQA DPENYTSLLV TWERPRVVYD TMIEKFAVLY QQLDGEDQTK 360 

HEFLTDGYQD LGAILNNLLP NMSYVLQIVA ICTNGLYGKY SDQLIVDMPT DNPELDLFPE 420 

LIGTEEIIKE EEEGKDIEEG AIVNPGRDSA TNQIRKKEPQ ISTTTHYNRI GTKYNEAKTN 480 

RSPTRGSEFS GKGDVPNTSL NSTSQPVTKL ATEKDISLTS QTVTELPPHT VEGTSASLND 540 

GSKTVLRSPH MNLSGTAESL NTVSITEYEE ESLLTSFKLD TGAEDSSGSS PATSAIPFIS 600 

ENISQGYIFS SENPETITYD VLIPESARNA SEDSTSSGSE ESLKDPSMEG NVWFPSSTDI 660 

TAQPDVGSGR ESFLQTNYTE IRVDESEKTT KSFSAGPVMS QGPSVTDLEM PHYSTFAYFP 720 

TEVTPHAFTP SSRQQDLVST VNVVYSQTTQ PVYNEASNSS HESRIGLAEG LESEKKAVIP 780 

LVIVSALTFI CLVVLVGILI YWRKCFQTAH FYLEDSTSPR VISTPPTPIF PISDDVGAIP 840 

IKHFPKHVAD LHASSGFTEE FETLKEFYQE VQSCTVDLGI TADSSNHPDN KHKNRYINIV 900 

AYDHSRVKLA QLAEKDGKLT DYINANYVDG YNRPKAYIAA QGPLKSTAED FWRMIWEHNV 960 

EVIVMITNLV EKGRRKCDQY WPADGSEEYG NFLVTQKSVQ VLAYYTVRNF TLRNTKIKKG 1020 

SQKGRPSGRV VTQYHYTQWP DMGVPEYSLP VLTFVRKAAY AKRHAVGPVV VHCSAGVGRT 1080 

GTYIVLDSML QQIQHEGTVN IFGFLKHIRS QRNYLVQTEE QYVFIHDTLV EAILSKETEV 1140 

LDSHIHAYVN ALLIPGPAGK TKLEKQFQGL TLSPRLECRG TISAHCNLPL PGLTDPPTSA 1200 

SRVAGTILLS QSNIQQSDYS AALKQCNREK NRTSSIIPVE RSRVGISSLS GEGTDYINAS 1260 

YIMGYYQSNE FIITQHPLLH TIKDFWRMIW DHNAQLVVMI PDGQNMAEDE FVYWPNKDEP 1320 

INCESFKVTL MAEEHKCLSN EEKLIIQDFI LEATQDDYVL EVRHFQCPKW PNPDSPISKT 1380 

FELISVIKEE AANRDGPMIV HDEHGGVTAG TFCALTTLMH QLEKENSVDV YQVAKMINLM 1440 
RPGVFADIEQ YQFLYKVILS LVGTRQEENP STSLDSNGAA LPDGNIAESL ESLV 



Seq ID NO: 189 DNA sequence 
Nucleic Acid Accession #: NM_002820 
Coding sequence: 304.. 831 

1 11 21 31 41 51 

1 1 I I I 1 

CCGGTTCGCA AAGAAGCTGA CTT CAGAGGG GGAAACTTTC TTCTTTTAGG AGGCGGTTAG 60 
CCCTGTTCCA CGAACCCAGG AGAACTGCTG GCCAGATTAA TTAGACATTG CTATGGGAGA 120 
CGTGTAAACA CACTACTTAT CATTGATGCA TATATAAAAC CATTTTATTT TCGCTATTAT 180 



i 



263 



WO 02/086443 

TTCAGAGGAA GCGCCTCTGA 
GTTTGGAGAA AGCACAGTTG 
ACGATGCAGC GGAGACTGGT 
GTGCCCTCCT GCGGGCGCTC 
GAACATCAGC TCCTCCATGA 
CTTCACCATC TGAT CGCAGA 
CCTAACTCCA AGCCCTCTCC 
GAGGGCAGAT ACCTAACTCA 
AAGACACCTG GGAAGAAAAA 
AAACGGCGAA CTCGCTCTGC 
GACCACCTGT CTGACACCTC 
CTGGCCCGTA GCCTCAGCGG 
GCTTGGACAA ACCTAGAATT 
CAGAGAATAA CTCAGAATAT 
TGTCCTCCAG CACCATAGAG 
CATCAATCCT TTACCACTCT 
ATCTTCATAA TTTGCTGGAG 
TTCTTCAGTG TTTTTCATTT 
GAT ATT AT CT ACAAACACTG 
ACTTTTTATT TAATTAAATG 
TAAATTATGT TTTAAACACA 
CCAGCTCATA CAAAATAAAT 
GGTTTTTCTC ATGTATCTTT 
CCGTAGGAAA AATAAAACTT 



TTTGTTTCTT TTTTCCCTTT 
GAGTAGCCGG TTGCTAAATA 
TCAGCAGTGG AG CGTCGCGG 
GGTGGAGGGT CTCAGCCGCC 
CAAGGGGAAG TCCATCCAAG 
AATCCACACA GCTGAAATCA 
CAACACAAAG AACCACCCCG 
GGAAACTAAC AAGGTGGAGA 
GAAAGGCAAG CCCGGGAAAC 
CTGGTTAGAC TCTGGAGTGA 
CACAACGTCG CTGGAGCTCG 
GGTGCTCTCA GCTGGGTTTT 
TTCTCCCTTT ATGTATCTCT 
TGT CTGCCTT AAAGCAGTAC 
AGGCGCTAGA GCCCATTCCT 
ACCAAATAAT TTCATATTCA 
AAGTGTATTT CTTCCCCTTA 
CTTACGTTCT TTCACTTCAA 
C AG AAC AG C A TC ATGT CAT A 
TATTTAATTA AATCTCAAAT 
TGCCTTAAAT TTGTTTAATT 
GGTTTCTGAA AATGTTTAAG 
TTGTTCATTG GCAAGATGAA 
CACATTTAAA AAAAA 



TTGCTCTTTC TGGCTGTGTG 
AGTCCCGAGC GCGAGCGGAG 
TGTTCCTGCT GAGCTACGCG 
GCCTCAAAAG AGCTGTGTCT 
ATTTACGGCG ACGATTCTTC 
GAGCTACCTC GGAGGTGTCC 
TCCGAT TTGG GTCTGATGAT 
CGTACAAAGA GCAGCCGCTC 
GCAAGGAGCA GGAAAAGAAA 
CTGGGAGTGG GCTAGAAGGG 
ATTCACGGTA ACAGGCTTCT 
GGAGCCTCCC TTCTGCCTTG 
ATCGATTGTG TAGCAATTGA 
CCCCCTACCA CACACACCCC 
CTTTCTCCAC CGTCACCCAA 
AGCTTCAGAA GCTAGTGACC 
CTCTCACACC TGGGCAAACT 
GGGAGAATAT AGAAGCATTT 
AACGATTCTG AGCCATTCAC 
TTATTTTAAT GTAAAGAACT 
AAATTTAACT CTGGTTTCTA 
TATTAACTTA CAAGGATATA 
ATAATTTTTC TAGGGTAATG 



Seq ID NO: 190 Protein sequence: 
Protein Accession #: NP_002811 



1 11 21 31 41 51 

I I I I I I 

MQRRLVQQWS VAVFLLSYAV PSCGRSVEGL SRRLKRAVSE HQLLHDKGKS IQDLRRRFFL 

HHLIAEIHTA EIRATSEVSP NSKPSPNTKN HPVRFGSDDE GRYLTQETNK VETYKEQPLK 

TPGKKKKGKP GKRKEQEKKK RRTRSAWLDS GVTGSGLEGD HLSDTSTTSL ELDSR 

Seq ID NO: 191 DNA sequence 
Nucleic Acid Accession #: XM_059328 
Coding sequence: 52.. 1023 

1 11 21 31 41 51 

l I I l I I 

GGGCTGTCCG GCCCACTCCC CTGGGAGCGC GAG CGGTGGA CCCAGGCGGC CATGTCCCGC 
CCTCGCATGC GCCTGGTGGT CACCGCGGAC GACTTTGGTT ACTGCCCGCG ACGCGATGAG 
GGTATCGTGG AGGCCTTTCT GGCCGGGGCT GTGACCAGCG TGTCCCTGCT GGT CAACGGT 
GCGGCCACGG AGAGCGCGGC GGAGCTGGCC CGCAGGCACA GCATCCCCAC GGGCCTCCAC 
GCCAACCTGT CCGAGGGCCG CCCCGTGGGT CCGGCCCGCC GTGGCGCCTC ATCGCTGCTC 
GGCCCGGAAG GCTTCTTCCT TGGCAAGATG GGATTCCGGG AGGCGGTGGC GGCCGGAGAC 
GTGGATTTGC CTCAGGTGCG GGAGGAGCTC GAGGCCCAAC TAAGCTGCTT CCGGGAGCTG 
CTGGGCAGGG CCCCCACGCA CGCGGACGGG CACCAGCACG TGCACGTGCT CCCAGGCGTG 
TGCCAGGTGT TCGCCGAGGC GCTGCAGGCC TATGGGGTGC GCTTTACGCG ACTGCCGCTG 
GAGCGCGGTG TGGGTGGCTG CACTTGGCTG GAGGCCCCCG CGCGTGCCTT CGCCTGCGCC 
GTGGAGCGCG ACGCCCGGGC CGCCGTGGGC CCCTTCTCCC GCCACGGCCT GCGGTGGACA 
GACGCCTTCG TGGGCCTGAG CACTTGCGGC CGGCACATGT CCGCTCACCG CGTGTCCGGG 
GCCCTGGCGC GGGTCCTGGA AGGTACCCTA GCGGGCCACA CCCTGACAGC CGAGCTGATG 
GCGCACCCCG GCTACCCCAG TGTGCCTCCC ACCGGCGGCT GCGGTGAAGG CCCCGACGCT 
TTCTCTTGCT CTTGGGAGCG GCTGCATGAG CTGCGCGTCC TCACCGCGCC CACGCTGCGG 
GCCCAGCTTG CCCAGGATGG CGTGCAGCTT TGCGCCCTCG ACGACCTGGA CTCCAAGAGG 
CCAGGGGAGG AGGTCCCCTG TGAGCCCACT CTGGAACCCT TCCTGGAACC CTCCCTACTC 
TGACCCCCTA CAGACAACCA AGCACTAATC CCCTTAGTAC CAAGAAAGGG GAGCCAGGAT 
TTAGTCCTGG CCCAGCCCAG AGCTGGGACC TGGAGCACGA TCTGTTGACT TCCCTGGGTA 
GGACACTGCC ACCTCTGGGC TCAGGTCCTC ATGCCTCCAA ATGGCATCTA GAGTTTGAGC 
AGCCTTCTTG GCTGCAGGCA GGCCTAGCCT GTGGCAGCGG GCTAGGGCCC GCAGAGCATT 
TGGTGCCCCT CCATGTTGCA ATGCAAACAC CTTCACCACT GGGGCAGTGG GGAGAGATGG 
CTATATTAAT AAAATAACGT GTGTCTTTC 

Seq ID NO: 192 Protein sequence: 
Protein Accession #: XP_059328 



1 11 21 31 41 51 

I I I I I I 

MSRPRMRLVV TADDFGYCPR RDEGIVEAFL AGAVTSVSLL VNGAATESAA ELARRHSIPT 
GLHANLSEGR PVGPARRGAS SLLGPEGFFL GKMGFREAVA AGDVDLPQVR EELEAQLSCF 
RELLGRAPTH ADGHQHVHVL PGVCQVFAEA LQAYGVRFTR LPLERGVGGC TWLEAPARAF 
ACAVERDARA AVGPFSRHGL RWTDAFVGLS TCGRHMSAHR VSGALARVLE GTLAGHTLTA 
ELMAHPGYPS VPPTGGCGEG PDAFSCSWER LHELRVLTAP TLRAQLAQDG VQLCALDDLD 
SKRPGEEVPC EPTLEPFLEP SLL 

Seq ID NO: 193 DNA sequence 

Nucleic Acid Accession #: NM_005688.1 

Coding sequence: 126.. 4439 

1 11 21 31 41 51 

I I I I I I 

CCGGGCAGGT GGCTCATGCT CGGGAGCGTG GTTGAGCGGC TGGCGCGGTT GTCCTGGAGC 

AGGGGCGCAG GAATTCTGAT GTGAAACTAA CAGTCTGTGA GCCCTGGAAC CTCCGCTCAG 
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AGAAGATGAA GGATATCGAC 
GTGTGAGGGA GAGAACCAGC 
GGAGAACTCG ACCGTTGGAA 
TCTCTCTTGA TGCCTCCATG 
GAAAGTACCA TCATGGCTTG 
ACCCAGTGGA CAATGCTGGG 
CCCGTGTGGC CCACAAGAAG 
ACGAGTCTTC TGACGTGAAC 
AAGTTGGGCC AGACGCTGCT 
TCATCCTGTC CAT CGTGTGC 
TCATGGTGAA ACACCTCTTG 
TGTTGTTAGT GCTGGGCCTC 
CTTGGGCATT GAATTACCGA 
TTAAGAAGAT CCTTAAGTTA 
TTTGCTCCAA CGATGGGCAG 
GAGGACCCGT TGTTGCCATC 
GCTTCCTGGG ATCAGCTGTT 
TCACAGCATA TTTCAGGAGA 
ATGAAGTTCT TAGTTACATT 
AGAGTGTTCA AAAAATCCGC 
AGGGTATCAC TGTGGGTGTG 
CTGTTCATAT GACCCTGGGC 
TCTTCAATTC CATGACTTTT 
AAGCCTCAGT GGCTGTTGAC 
TAAAGAACAA ACCAG CCAGT 
GGGACTCCTC CCACTCCAGT 
ACAAGAGGGC TTCCAGGGGC 
AGGCGGTGCT GGCAGAGCAG 
CCGAAGAGGA AGAAGGCAAG 
ACAGCATCGA TCTGGAGATC 
GTGGAAAAAC CTCTCTCATT 
TTGCAAT CAG TGGAACCTTC 
TGAGAGACAA CATCCTGTTT 
ACAGCTGCTG CCTGAGGCCT 
GAGAGCGAGG AGCCAACCTG 
TGTATAGTGA CAGGAGCATC 
TGGGCAACCA CATCTTCAAT 
TTGTTACCCA CCAGTTACAG 
GCTGTATTAC GGAAAGAGGC 
CCATTTTTAA TAACCTGTTG 
AAACCAGTGG TTCACAGAAG 
AGGAAAAAGC AGTAAAGCCA 
GTTCAGTGCC CTGGTCAGTA 
TCCTGGTTAT TATGGCCCTT 
GGTTGAGTTA CTGGAT CAAG 
CCTCGGTGAG TGACAGCATG 
CCCTCTCCAT GGCAGTCATG 
GCACGCTGCG AGCTTCCTCC 
CTATGAAGTT TTTTGACACG 
TGGATGAAGT TGACGTGCGG 
TGGTGTTCTT CTGTGTGGGA 
GGCCCCTTGT CATCCTCTTT 
TGAAGCGTCT GGACAATATC 
AGGGCCTTGC CACCATCCAC 
AGCTGCTGGA TGACAACCAA 
CTGTGCGGCT GGACCTCATC 
TTATGCACGG GCAGATTCCC 
TAACGGGGCT GTTCCAGTTT 
CGGTGGAGAG GATCAATCAC 
AGAACAAGGC TCCCTCCCCT 
AGATGAGGTA CCGAGAAAAC 
CTAAAGAGAA GATTGGCATT 
CCCTCTTCCG TCTGGTGGAG 
GTGATATTGG CCTTGCCGAC 
TGTTCAGTGG CACTGTCAGA 
TTTGGGATGC CCTGGAGAGG 
TTGAAT CTGA AGTGATGGAG 
GCATAGCTAG AGCCCTGCTC 
CCATGGACAC AGAGACAGAC 
GTACCATGCT GACCATTGCC 
TGCTGGCCCA GGGACAGGTG 
GTTCCCGATT CTATGCCATG 
TCCTCCCTGT TGACGAAGTC 
CCCCTCATCG CGTCCTCCTA 
GTTCCGGATT GGCTTGTGTG 
ATTCCATATT CATGTAAACA 
GGGAACCGTT ATTATAATTG 
TCTATATATA ATTCTGTACA 
TATTAAAATA AGCACTGTGC 
TTGCTGTACT AGAGATCTGG 
CTCTAGCTGG TGGTTTCACG 
ATAGTGGGCC CTCCGACAGC 
GAGACGGGTG GGCGGCTGGA 
CTGTCCTGGT GTCACTTACT 
TTTCACTCCC T CCATCAAGA 
TTTCCTGCCT TCTTCTTTTT 
TCCCACTGCC TCAGGTTCCT 
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ATAGGAAAAG 
ACTTCTGGGA 
TGCCAAGATG 
CATTCTCAGC 
AGTGCTCTGA 
CTTTTTTCCT 
GGGGAGCTCT 
TGCAGAAGAC 
TCCCTGCGAA 
CTGATGATCA 
GAGTATACCC 
CTCCTGACGG 
ACCGGTGTCC 
AAGAACATTA 
AGAATGTTTG 
TTAGGCATGA 
TTTATCCTCT 
AAATGCGTGG 
AAATTT AT CA 
GAGGAGGAGC 
GCTCCCATTG 
TTCGATCTGA 
GCTTTGAAAG 
AGATTTAAGA 
CCTCACATCA 
ATCCAGAACT 
AAGAAAGAGA 
AAAGGCCACC 
CACATCCACC 
CAAGAGGGTA 
TCAGCCATTT 
GCTTATGTGG 
GGGAAGGAAT 
GACCTGGCCA 
AGCGGTGGGC 
TACATCCTGG 
AGTGCTATCC 
TACCTGGTTG 
ACCCATGAGG 
CTGGGAGAGA 
AAGTCACAAG 
GAGGAAGGGC 
TATGGTGTCT 
TTCATGCTGA 
CAAGGAAGCG 
AAGGACAATC 
CTGATCCTGA 
CGGCTGCATG 
ACCCCCACAG 
CTGCCGTTCC 
ATGATCGCAG 
TCAGTCCTGC 
ACGCAGTCAC 
GCCTACAATA 
GCTCCTTTTT 
AGCATCGCCC 
CCAGCCTATG 
ACGGTCAGAC 
TACATTAAGA 
GACTGGCCCC 
CTCCCTCTTG 
GTGGGGCGGA 
TT AT CTGGAG 
CTCCGAAGCA 
TCAAATTTGG 
ACACACATGA 
AATGGGGATA 
CGCCACTGTA 
TTATTGATTC 
CATCGCCTGC 
GTGGAGTTTG 
TTTGCTGCTG 
TCTTTTCTTT 
CCGAAACCTT 
TTTCACTTTT 
AAATTTAGTT 
TATCAGAGGC 
TAGCCTATAT 
TAATAACAGT 
TTTTGCTATT 
GTGCCAGGTT 
CCCCTCTGCC 
GACCATGCAG 
GTTTCTGTCA 
ATGGGGAT CA 
GCTGTTGTTT 
ATGGCTGGCC 



AGTATATCAT 
CGCACAGAGA 
CCTTGGAAAC 
TCAGAATCCT 
AGCCCATCCG 
GTATGACTTT 
CAATGGAAGA 
TAGAGAGACT 
GGGTTGTGTG 
CGCAGCTGGC 
AGGCAACAGA 
AAATCGTGCG 
GCTTGCGGGG 
AAGAGAAATC 
AGG CAGCAGC 
TTTATAATGT 
TTTACCCAGC 
CCGCCACGGA 
AAATGTATGC 
GTCGGATATT 
TGGTGGTGAT 
CAGCAGCACA 
TAACACCGTT 
GTTTGTTTCT 
AGATAGAGAT 
CGCCCAAGCT 
AGGTGAGGCA 
TCCTCCTGGA 
TGGGCCACCT 
AACTGGTTGG 
TAGGCCAGAT 
CCCAGCAGGC 
ATGATGAAGA 
TTCTTCCCAG 
AGCGCCAGAG 
ACGACCCCCT 
GGAAACATCT 
ACTGTGATGA 
AACTGATGAA 
CACCGCCAGT 
ACAAGGGTCC 
AGCTTGTGCA 
ACATCCAGGC 
ATGTAGGCAG 
GGAACACCAC 
CTCATATGCA 
AAGCCATTCG 
ACGAGCTTTT 
GGAGGATTCT 
AGGCCGAGAT 
GAGTCTTCCC 
ACATTGTCTC 
CTTTCCTCTC 
AAGGGCAGGA 
TTTTGTTTAC 
TCATCACCAC 
CGGGTCTCGC 
TGGCATCTGA 
CTCTGTCCTT 
AGGAGGGAGA 
TCCTAAAGAA 
CAGGATCAGG 
GCTGCATCAA 
AACTCTCTAT 
ACCCCTTCAA 
AAGAATGTAT 
ACTTCTCAGT 
AGATTCTGAT 
AAGAGACCAT 
ACACGGTTCT 
ACACCCCATC 
CAGAGAACAA 
AGAG CATTGC 
GCCTTTCTCG 
AGGGAGAGTC 
TTTGTTCTTA 
CTATAATGAA 
TTACAGTGAA 
GCATATTCCT 
AGACTGTAGG 
TTCTGGGTGT 
GCCTCCCCAC 
AGCGCCGTGA 
GGAGAGCAGC 
CAGAGACATT 
CTAAACAAGA 
AC TG CACAG A 



CCCCAGTCCT 
CCGTGAAGAT 
AGCAGCCCGA 
GGATGAGGAG 
GACTACTTCC 
TTCGTGGCTT 
CGTGTGGTCT 
GTGGCAAGAA 
GATCTTCTGC 
TGGCTTCAGT 
GTCTAACCTG 
GTCTTGGTCG 
GGCCATCCTA 
CCTGGGTGAG 
CGTTGGCAGC 
AATTATTCTG 
AATGATGTTT 
TGAACGTGTC 
CTGGGTCAAA 
GGAAAAAGCC 
TGCCAGCGTG 
GGCTTTCACA 
TTCAGTAAAG 
AATGGAAGAG 
GAAAAATGCC 
GACCCCCAAA 
GCTGCAGCGC 
CAGTGACGAG 
GCGCTTACAG 
AATCTGCGGC 
GACGCTTCTA 
CTGGATCCTC 
AAGATACAAC 
CAGCGACCTG 
GAT CAGCCTT 
CAGTGCCTTA 
CAAGT C CAAG 
AGTGATCTTC 
TTTAAATGGT 
TGAGATCAAT 
TAAAACAGGA 
GCTGGAAGAG 
TGCTGGGGGC 
CACCGCCTTC 
TGTGACTCGA 
GTACTATGCC 
AGGAGTTGTC 
CCGAAG GAT C 
CAACAGGTTT 
GTTCATCCAG 
GTGGTTCCTT 
CAGGGTCCTG 
CCACATCACG 
GTTTCTGCAC 
GTGTGCGATG 
CACGGGGCTG 
CATCTCTTAT 
GACAGAAGCT 
GGAAGCACCT 
GGTGACCTTT 
AGTATCCTTC 
GAAGTCCTCG 
GATTGATGGA 
CATTCCTCAA 
CCAGTACACT 
TGCTCAGCTA 
GGGGGAACGG 
TTTAGATGAA 
CCGAGAAGCA 
AGGCTCCGAT 
GGTCCTTCTG 
GGTCGCTGTC 
CATTCCCTGC 
ATTTTATCTT 
ATATTTTGAT 
ATTGCACTCT 
GCTTTATACG 
AATGTAAGCT 
TTCTATCATT 
AAGAGTAGCA 
CCAAAGGAAG 
AGCCGCTCCA 
GTTCTCAGGG 
GGGG CGAAGC 
CCTCCGAGCC 
ATCAGTCTAT 
GCTCTCCAGC 



GGGTATAGAA 180 

TCCAAGTTCA 240 

GCCGAGGGCC 3 00 

CATCCCAAGG 3 60 

AAACACCAGC 42 0 

TCTTCTCTGG 480 

CTGTCCAAGC 540 

GAGCTGAATG 600 

CGCACCAGGC 660 

GGACCAGCCT 72 0 

CAGTACAGCT 780 

CTTGCACTGA 840 

ACCATGGCAT 900 

CT CAT C AAC A 960 

CTGCTGGCTG 1020 

GGACCAACAG 10 80 

GCATCACGGC 1140 

CAGAAGATGA 1200 

GCATTTTCTC 12 60 

GGGTACTTCC 132 0 

GTGACCTTCT 13 80 

GTGGTGACAG 1440 

TCCCTCTCAG 1500 

GTTCACATGA 1560 

ACCTTGGCAT 1620 

ATGAAAAAAG 1680 

ACTG AG CAT C 1740 

CGGCCCAGTC 1800 

AGGACACTGC 1860 

AGTGTGGGAA 192 0 

GAGGGCAGCA 1980 

AATGCTACTC 2040 

TCTGTGCTGA 2100 

ACGGAG AT TG 2160 

GCCCGGGCCT 2220 

GATGCCCATG 2280 

ACAGTTCTGT 2340 

ATGAAAGAGG 240 0 

GACTATGCTA 2460 

TCAAAAAAGG 2520 

TCAGTAAAGA 2580 

AAAGGGCAGG 2640 

CCCTTGGCAT 2700 

AGCACCTGGT 2 760 

GGGAACGAG A 2 82 0 

AGCATCTACG 2 880 

TTTGTCAAGG 2940 

CTTCGAAGCC 3 000 

TCCAAAGACA 3 060 

AACGTTATCC 3120 

GTGGCAGTGG 3180 

ATTCGGGAGC 324 0 

TCCAGCATAC 33 00 

AGATACCAGG 3360 

CGGTGGCTGG 3420 

AT GAT CGTT C 34 80 

GCTGTCCAGT 3540 

CGATTCACCT 3 600 

GCCAGAATTA 3 660 

GAGAACGCAG 3 72 0 

ACGATCAAAC 9 3780 

CTGGGGATGG 3840 

GTGAGAATCA 3900 

GAGCCGGTGC 3960 

GAAGACCAGA 402 0 

CCTCTGAAAC 4080 

CAGCTCTTGT 4140 

GCCACAGCTG 4200 

TTTGCAGACT 4260 

AGGATTATGG 4320 

TCCAACGACA 4380 

AAGGGCTGAC 4440 

CTGGGGCGGG 4500 

TCG CACAG CA 4560 

TATTGTATTT 462 0 

AAAAGGTTCA 4680 

TGTAGCTATA 4740 

GTTTATTTTA 4800 

TTTGTACAGT 4860 

TTT CATTCTT 4920 

ACGTGTGGCA 4980 

GGGGTGGCTG 5040 

CTCCTGCCTT 5100 

CCAGGCCCCT 5160 

GGGGAGTTTC 522 0 

CCACAGAGAG 52 80 

TCCAAGACCT 5340 



265 
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GTTGGTTCCA AGCCCTGGAG CCAACTGCTG CTTTTTGAGG TGGCACTTTT TCATTTGCCT 5400 

ATTCCCACAC CTCCACAGTT CAGTGGCAGG GCTCAGGATT TCGTGGGTCT GTTTTCCTTT 5460 

CTCACCGCAG TCGTCGCACA GTCTCTCTCT CTCTCTCCCC TCAAAGTCTG CAACTTTAAG 5520 

CAGCTCTTGC TAATCAGTGT CTCACACTGG CGTAGAAGTT TTTGTACTGT AAAGAGACCT 5580 

ACCTCAGGTT GCTGGTTGCT GTGTGGTTTG GTGTGTTCCC GCAAACCCCC TTTGTGCTGT 5640 

GGGGCTGGTA GCTCAGGTGG GCGTGGTCAC TGCTGTCATC AGTTGAATGG TCAGCGTTGC 5700 

ATGTCGTGAC CAACTAGACA TTCTGTCGCC TTAGCATGTT TGCTGAACAC CTTGTGGAAG 5760 

CAAAAATCTG AAAATGTGAA TAAAATTATT TTGGATTTTG TAAAAAAAAA AAAAAAAAAA 5820 
AAAAAAAAAA AAAAAAAA 

Seq ID NO: 194 Protein sequence: 
Protein Accession #: NP_005679.1 



MKDIDIGKBY IIPSPGYRSV RERTSTSGTH RDREDSKFRR TRPLECQDAL ETAARAEGIj S 60 

LDASMHSQLR ILDEEHPKGK YHHGLSALKP IRTTSKHQHP VDNAGLFS CM TFSWLSSLAR 12 0 

VAHKKGELSM EDVWSLSKHE SSDVNCRRLE RLWQEELNEV GPDAASLRRV VWIFCRTRLI 180 

LSIVCLMITQ LAGFSGPAFM VKHLLEYTQA TESNLQYSLL LVLGLLLTEI VRSWSLALTW 240 

ALNYRTGVRL RGAILTMAFK KILKLKNIKE KSLGELINIC SNDGQRMFEA AAVGSLLAGG 300 

PWAILGMIY NVIILGPTGF LGSAVFILFY PAMMFASRL»T AYFRRKCVAA TDERVQKMNE 360 

VLTYIKFIKM YAWVKAFSQS VQKIREEERR ILEKAGYFQG ITVGVAPIW VIASWTFSV 420 

HMTLGFDLTA AQAFTWTVF NSMTFALKVT PFSVKSLSEA SVAVDRFKSL FLMEEVHMIK 480 

NKPASPHIKI EMKNATLAWD SSHSSIQNSP KLTPKMKKDK RASRGKKEKV RQLQRTEHQA 540 

VLAEQKGHIiIi LDSDERPSPE EEEGKHIHLG HLRLQRTLHS IDLEIQEGKL VGICGSVGSG 600 

KTSLISAILG QMTLLEGSIA I SGTFAYVAQ QAWILNATLR DNILFGKEYD EERYNSVLNS 660 

CCLRPDLAIL PSSDLTEIGE RGANLSGGQR QRISLARALY SDRSIYILDD PLSALDAHVG 72 0 

NHIFNSAIRK HLKSKTVLFV THQLQYLVDC DEVI FMKEGC ITERGTHEEL MNLNGD YAT I 780 

FNNLLLGETP PVEINSKKET SGSQKKSQDK GPKTGSVKKE KAVKPEEGQL VQLEEKGQGS 840 

VPWSVYGVYI QAAGGPLAFL VIMALFMLNV GSTAFSTWWL SYWIKQGSGN TTVTRGNETS 900 

VSDSMKDNPH MQYYASIYAL SMAVML I LKA IRGWFVKGT LRASSRLHDE LFRRILRSPM 960 

KFFDTTPTGR ILNRFSKDMD EVDVRLPFQA EMFIQNVILV FFCVGMIAGV FPVJFLVAVGP 1020 

LVILFSVLHI VSRVLIRELK RLDNITQSPF USHITSSIQG IiATIHAYNKG QEFLHRYQEL 1080 

LDDNQAPFFL FTCAMRWLAV RLDLISIALI TTTGLMIVLM HGQIPPAYAG LAI S YAVQLT 1140 

GLFOFTVRLA SETEARFTSV ERINHYIKTL SLEAPARIKN KAPSPDWPQE GEVTFENAEM 1200 

RYRENLPLVL KKVSFTIKPK EKIGIVGRTG SGKSSLGMAL FRLiVELiSGGC IKIDGVRISD 1260 

IGLADLRSKL SIIPQEPVLF SGTVRSNLDP FNQYTEDQIW DALERTHMKE CIAQLPLKLE 1320 

SEVMENGDNF SVGERQLLCI ARALLRHCKI LILDEATAAM DTETDLLIQE TIREAFADCT 1380 
MliT 1 AHRLHT VLGSDRIMVL AQGQWEFDT PSVLLSNDSS RFYAMFAAAE NKVAVKG 

t 

Seq ID NO: 195 DNA sequence 
Nucleic Acid Accession #: NM_006470 
Coding sequence: 228..1922 



1 11 21 31 41 51 

I i 111) 

GCTGTCCTGA GCCTGAGTAC TCTAGCTGCC TTGTCGCCAT CGCATCTGGC TGCCATCCAG 60 

CGCCAGCACA CAGTAATGAG TGGCCGAGCT TCCTCTGGGA GGGAGGAAAC AGTTAAAATC 12 0 

TTGCAGCAGC TGCAATCATC TAGGCGTGGT TCTCTTGTCT GACTTGGGCT GCACAGATCC 180 

TGGGCCAAGG GACAGAAGAA AGACAGCCTA GGAGCAGAGC CTCCCAGATG GCTGAGTTGG 240 

ATCTAATGGC TCCAGGGCCA CTGCCCAGGG CCACTGCTCA GCCCCCAGCC CCTCTCAGCC 300 

CAGACTCTGG GTCACCCAGC CCAGATTCTG GGTCAGCCAG CCCAGTGGAA GAAGAGGACG 360 

TGGGCTCCTC GGAGAAGCTT GGCAGGGAGA CGGAGGAACA GGACAGCGAC TCTGCAGAGC 420 

AGGGGGATCC TGCTGGTGAG GGGAAAGAGG TCCTGTGTGA CTTCTGCCTT GATGACACCA 480 

GAAGAGTGAA GGCAGTGAAG TCCTGTCTAA CCTGCATGGT GAATTACTGT GAAGAGCACT 540 

TGCAGCCGCA TCAGGTGAAC AT C AAACTGC AAAGCCACCT GCTGACCGAG CCAGTGAAGG 600 

ACCACAACTG GCGATACTGC CCTGCCCACC ACAGCCCACT GTCTGCTTTC TGCTGCCCTG 660 

ATCAGCAGTG CATCTGCCAG GACTGTTGCC AGGAGCACAG TGGCCACACC ATAGTCTCCC 72 0 

TGGATGCAGC CCGCAGGGAC AAGGAGGCTG AACTCCAGTG CACCCAGTTA GACTTGGAGC 780 

GGAAACTCAA GTTGAATGAA AATGCCATCT CCAGGCTCCA GGCTAACCAA AAGT CTGTTC 840 

TGGTGTCGGT GTCAGAGGTC AAAGCGGTGG CTGAAATGCA GTTTGGGGAA CTCCTTGCTG 900 

CTGTGAGGAA GGCCCAGGCC AATGTGATGC TCTTCTTAGA GGAGAAGGAG CAAGCTGCGC 960 

TGAGCCAGGC CAACGGTATC AAGGCCCACC TGGAGTACAG GAGTGCCGAG ATGGAGAAGA 102 0 

GCAAGCAGGA GCTGGAGAGG ATGGCGGCCA TCAGCAACAC TGTCCAGTTC TTGGAGGAGT 1080 

ACTGCAAGTT TAAGAACACT G AAGACAT CA CCTTCCCTAG TGTTTACGTA GGGCTGAAGG 1140 

ATAAACT CTC GGGCATCCGC AAAGTTATCA CGGAATCCAC TGTACACTTA ATCCAGTTGC 12 0 0 

TGGAGAACTA TAAGAAAAAG CTCCAGGAGT TTTCCAAGGA AGAGGAGTAT GACATCAGAA 1260 

CTCAAGTGTC TGCCGTTGTT CAG CGCAAAT ATTGGACTTC CAAACCTGAG CCCAGCACCA 1320 

GGGAACAGTT CCTCCAATAT GCGTATGACA TCACGTTTGA CCCGGACACA GCACACAAGT 1380 

ATCTCCGGCT GCAGGAGGAG AACCG CAAGG TCACCAACAC CACGCCCTGG GAGCATCCCT 1440 

ACCCGGACCT CCCCAGCAGG TTCCTGCACT GGCGGCAGGT GCTGTCCCAG CAGAGTCTGT 1500 

ACCTGCACAG GTACTATTTT GAGGTGGAGA TCTTCGGGGC AGGCACCTAT GTTGGCCTGA 1560 

CCTGCAAAGG CATCGACCGG AAAGGGGAGG AGCGCAACAG TTGCATTTCC GGAAACAACT 1620 

TCTCCTGGAG CCTCCAATGG AACGGGAAGG AGTTCACGGC CTGGTACAGT GACATGGAGA 1680 

CCCCACTCAA AGCTGGCCCT TTCCGGAGGC TCGGGGTCTA TAT CGACTT C CCGGGAGGGA 1740 

TCCTTTCCTT CTATGGCGTA GAGTATGATA CCATGACTCT GGTTCACAAG TTTGCCTGCA 180 0 

AATTTTCAGA ACCAGTCTAT GCTGCCTTCT GGCTTTCCAA GAAGGAAAAC GCCATCCGGA 1860 

TTGTAGATCT GGGAGAGGAA CCCGAGAAGC CAGCACCGTC CTTGGGGGTG ACTGCTCCCT 1920 

AGACTCCAGG AGCCATATCC CAGACCTTTG CCAGCTACAG TGATGGGATT TGCATTTTAG 1980 

GGTGATTTGT GGGCAGAAAT AACTGCTGAT GGTAGCTGGC TTTTGAAATC CTATGGGGTC 2 040 

TCTGAATGAA AACATTCTCC AGCTGCTCTC TTTTGCTCCA TATGGTGCTG TTCTCTATGT 2100 

GTTTGCAGTA ATTCTTTTTT TTTTTTTTGA GACGGAGTCT CGCACTGTTG CCCAGGCTGG 2160 

AGAGCAGTGG CGCGAT CTTG GCTCACTGCA AGCTCCGCCT CCCGAGTTCA AGCAATTCTC 2220 

CTGCCTCAGC CTCCCGAGTA GCTGGGATTA CAGGTGCCTG CCACCACACC CAGCTAATGT 2280 

TTTGTATTTT TAGTAGAGAT GGGGTTTCAC CATGTTGGCC AGGCAGATCT CAAACT CCTG 2340 
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ACCTCGTGAT GCACCCACCT 
CGCCCTGCCT GTTTGTAGTA 
CTCCTCTCTG TTCAGGTAAA 
GAGTGGCTGA AAAGATTGCA 



CGGCCTCCCA AAGTGCTGGG 
ATTTTTAGGC ACCAAATCTC 
TGTCACACTG TGCCCAGAAT 
GAGTTATCAT AATAAATTGC 



ATTACATGCG TGAGCCACTG 
CCTCATCTTC TAGTGCCATT 
GGATGACCAG GAACCTTAAA 
TAACTTGCGT 



Seq ID NO: 196 Protein sequence: 
Protein Accession #: NP_006461 



I 

MAELDLMAPG 
DSAEQGDPAG 
EPVKDHNWRY 
LDLERKLKLN 
EQAALSQANG 
VGLKDKLSGI 
EPSTREQFLQ 
QQSLYLHRYY 
SDMETPLKAG 
NAIRIVDLGE 



11 
I 

PLPRATAQPP 
EGKEVLCDFC 
CPAHHSPLSA 
ENAISRLQAN 
I KAHLE YRSA 
RKVITESTVH 
YAYDITFDPD 
FEVEIFGAGT 
PFRRLGVYID 
EPEKPAPSLG 



21 

1 

APLSPDSGSP 
LDDTRRVKAV 
FCCPDQQCIC 
QKSVLVSVSE 
EMEKSKQELE 
LIQLLENYKK 
TAHKYLRLQE 
YVGLTCKGID 
FPGGILSFYG 
VTAP 



31 
I 

SPDSGSASPV 
KS CLTCMVN Y 
QDCCQEHSGH 
VKAVAEMQFG 
RMAAISNTVQ 
KLQEFSKEEE 
ENRKVTNTTP 
RKGEERNSCI 
VEYDTMTLVH 



41 



EEEDVGSSEK 
CEEHLQPHQV 
TIVSLDAARR 
ELLAAVRKAQ 
FLEEYCKFKN 
YDIRTQVSAV 
WEHPYPDLPS 
SGNNFSWSLQ 
KFACKFSEPV 



51 
I 

LGRETEEQDS 
NIKLQSHLLT 
DKEAELQCTQ 
ANVMLFLEEK 
TEDITFPSVY 
VQRKYWTSKP 
RFLHWRQVLS 
WNGKEFTAWY 
YAAFWLSKKE 



Seq ID NO: 197 DNA sequence 
Nucleic Acid Accession #: NM_004316 
Coding sequence: 433-1149 



CCCGAGACCC 
GCGCGTTCAG 
GCGCCAGCGG 
GGAGGAGGGG 
TTGCTCCCAC 
GCTCCCGCTT 
GTCCCCCTCG 
CCGCCGCTGC 
CAGCCGCAGC 
GCCGCGGCGG 
CAGCAGCAGC 
TCAGGGGGCG 
GAACTGATGC 
CAGCAGCCGG 
AACCTGGGCT 
AGTAAGGTGG 
GACGAGCATG 
CCCAACTACT 
GACGAGGGCT 
TGGTTCTGAG 
ATCGCACAAC 
AAAAGAAAAA 
CCAACCCCAT 
AGCGCTCAGA 
ACCTGAGTCA 
GAGCAGCACA 
GCTCGGGTCC 
GAGTTGGTGT 



11 
I 

GGCGCAAGAG 
CACTGACTTT 
CAGCCTCACA 
AGGGAGGAGG 
TCTAAGAAGT 
CATATTTCCT 
CGGGCCCCGC 
GCATGGAAAG 
CCCAGCAGCG 
CCGCAGCCGC 
AGCAGCAGCA 
GTCAC AAGT C 
GCTGCAAACG 
CCGCCGTGGC 
TTGCCACCCT 
AGACACTGCG 
ACGCGGTGAG 
CCAACGACTT 
CTTACGACCC 
GGGCTCGGCC 
CTGCATCTTT 
AAAAGAAGAA 
CGCCAACTAA 
ACAGTATCTT 
ATGCGCAAAA 
CGCGTTATAG 
CTTCACCTCC 
CTTTC 



21 
I 

AGCGCAGCCT 
TGCTGCTGCT 
CGCGAGCGCC 
AGGCGGCGTG 
CTCCCGGGGA 
TTTCTTTCCC 
ACCTCGCGTC 
CTCTGCCAAG 
CTTCCTGCCG 
CGCAGCGGCA 
GCAGGCGCCG 
AG CGCCCAAG 
CCGGCTCAAC 
GCGCCGCAAC 
TCGGGAGCAC 
CTCGGCGGTC 
CGCCGCCTTC 
GAACT CCATG 
GCTCAGCCCC 
TGGTCAGGCC 
AGTGCTTTCT 
GAAGAAGAAA 
GCGAGGCATG 
TGCACTCCAA 
TGCAGCTTGT 
TAACTCCCAT 
CCGCCCTTTC 



31 



TAGTAGGAGA 
TCTGCTTTTT 
ACGCGAGGCT 
CAGGGAGGAG 
TTTTGTATAT 
TCTCTGTTCC 
CCGGATCGCT 
ATGGAGAGCG 
CCCGCAGCCT 
GCGCAGAGCG 
CAGCTGAGAC 
CAAGTCAAGC 
TTCAGCGGCT 
GAGCGCGAGC 
GTCCCCAACG 
GAGTACATCC 
CAGGCAGGCG 
GCCGGCTCGC 
GAGGAGCAGG 
CTGGTGCGAA 
TGTCAGTGGC 
AGAGAAGAAG 
CCTGAGAGAC 
TCATTCACGG 
GTGCAAAAGC 
CACCTCTAAC 
TTAGAGTGCA 



41 
I 

GGAACGCGAG 
TTTTTCTTAG 
CCCGAAGCCA 
AAAAAGCATT 
ATTTTTTAAC 
TGCACCCAAG 
CTGATTCCGC 
GCGGCGCCGG 
GTTTCTTTGC 
CGCAGCAGCA 
CGGCGGCCGA 
GACAGCGCTC 
TTGGCTACAG 
GCAACCGCGT 
GCGCGGCCAA 
GCGCGCTGCA 
TCCTGTCGCC 
CGGTCTCATC 
AGCTTCTCGA 
TGGACTTTGG 
GTTGGGAGGG 
AAAAAAACGA 
ATGGCTTTCA 
AGATATGAAG 
AGTGGGCTCC 
ACGCACAGCT 
GTTCTTAGCC 



51 



ACGCGGCAGA 
AAACAAGAAG 
ACCCGCGAAG 
TTCACCTTTT 
TTCCGTCAGG 
TTCTCTCTGT 
GACTCCTTGG 
CCAGCAGCCC 
CACGGCCGCA 
GCAGCAGCAG 
CGGCCAGCCC 
GTCTTCGCCC 
CCTGCCGCAG 
CAAGTTGGTC 
CAAGAAGATG 
GCAGCTGCTG 
CACCATCTCC 
CTACTCGTCG 
CTTCACCAAC 
AAGCAGGGTG 
GGAGAAAAGG 
AAACAGTCAA 
GAAAACGGGA 
AGCAACTGGG 
TGGCAGAAGG 
GAAAGTT CTT 
CTCTAGAAAC 



Seq ID NO: 198 Protein sequence: 
Protein Accession #: NP_004307 

1 11 21 31 41 51 

I I I I I I 

MESSAKMESG GAGQQPQPQP QQPFLPPAAC FFATAAAAAA AAAAAAAQSA QQQQQQQQQQ 

QQQQAPQLRP AADGQPSGGG HKSAPKQVKR QRSSSPELMR CKRRLNFSGF GYSLPQQQPA 

AVARRNERER NRVKLVNLGF ATLREHVPNG AANKKMSKVE TLRSAVEYIR ALQQLLDEHD 

AVSAAFQAGV LSPTISPNYS NDLNSMAGSP VSSYSSDEGS YDPLSPEEQE LLDFTNWF 

Seq ID NO: 199 DNA sequence 
Nucleic Acid Accession #: NM_007015 
Coding sequence: 1-1005 

1 11 21 31 41 51 

I I I I I I 

ATGACAGAGA ACTCCGACAA AGTTCCCATT GCCCTGGTGG GACCTGATGA CGTGGAATTC 

TGCAGCCCCC CGGCGTACGC TACGCTGACG GTGAAGCCCT CCAGCCCCGC GCGGCTGCTC 

AAGGTGGGAG CCGTGGT CCT CATTTCGGGA GCTGTGCTGC TGCTCTTTGG GGCCAT CGGG 

GCCTTCTACT TCTGGAAGGG GAGCGACAGT CACATTTACA ATGTCCATTA CACCATGAGT 

ATCAATGGGA AACTACAAGA TGGGTCAATG GAAATAGACG CTGGGAA C AA CTTGGAGACC 

TTTAAAATGG GAAGTGGAGC TGAAGAAGCA ATTGCAGTTA ATGATTTCCA GAATGGCATC 

ACAGGAATTC GTTTTGCTGG AGGAGAGAAG TGCTACATTA AAGCGCAAGT GAAGGCTCGT 

ATTCCTGAGG TGGGCGCCGT GACCAAACAG AGCATCTCCT CCAAACTGGA AGGCAAGATC 

ATGCCAGTCA AATATGAAGA AAATTCTCTT ATCTGGGTGG CTGTAGATCA GCCTGTGAAG 

GACAACAGCT TCTTGAGTTC TAAGGTGTTA GAACT CTGCG GTGACCTTCC TATTTTCTGG 

CTTAAACCAA CCTATCCAAA AGAAATCCAG AGGGAAAGAA GAGAAGTGGT AAGAAAAATT 

GTTCCAACTA CCACAAAAAG ACCACACAGT GGACCACGGA GCAACCCAGG CGCTGGAAGA 

CTGAATAATG AAACCAGACC CAGTGTTCAA GAGGACTCAC AAGCCTTCAA TCCTGATAAT 



267 



WO 02/086443 

CCTTATCATC AGCAGGAAGG GGAAAGCATG 
ATCTGTTGTA TAGAATGTAG GCGGAGCTAC 
GGGGGCTATT ACCCATGGCC TTATAATTAT 
ATGCCATGTA GCTGGTGGGT GGCCCGTATC 
CACGTGCTGT AAAATAAGAA CTAGCTGAAG 
ATGCTGATGG GACCATAAAA TATTTTTACA 
TAACAGAATT TTTTTAATCG TTTTCCAGAA 
AGTTCAAGTC TAAAATGCCA TAACCCCGTT 
CATAAGTCTT CCCTTGCTTG CATCTTCCAA 
AGTTTGCC 



ACATTCGACC CTAGACTGGA TCACGAAGGA 840 

ACCCACTGCC AGAAGATCTG TGAACCCCTG 900 

CAAGGCTGCC GTTCGGCCTG CAGAGTCATC 960 

TTGGGCATGG TGTGAAATCA CTT CAT AT AT 1020 

AGACAAC CAA AGAAGCATTA AGGCAGGTTG 1080 

CGCAGCCTGA GCGGTTATTC TTGACACTCT 1140 

CTTTAGTATA TGCAAATGCA CTGAAAGGGT 1200 

ATTTGTTATT TTTTATTTGC ATTGATTTGC 12 60 

AGCTATTTCG AAATAAACAC GAAAATTTAC 132 0 



Seq ID NO: 200 Protein sequence: 
Protein Accession #: NP_008946 



11 



21 



MTENSDKVPI 
AFYFWKGSDS 
TGIRFAGGEK 
DNSFLSSKVL 
LNNETRPSVQ 
GGYYPWPYNY 



ALVGPDDVEF 
HIYNVHYTMS 
CYIKAQVKAR 
ELCGDLPIFW 
EDSQAFNPDN 
QGCRSACRVI 



CSPPAYATLT 
INGKLQDGSM 
IPEVGAVTKQ 
LKPTYPKEIQ 
PYHQQEGESM 
MPCSWWVARI 



31 

] 

VKPSSPARLL 
EIDAGNNLET 
SISSKLEGKI 
RERREVVRKI 
TFDPRLDHEG 
LGMV 



41 
I 

KVGAVVLISG 
FKMGSGAEEA 
MPVKYEENSL 
VPTTTKRPHS 
ICCIECRRSY 



51 



AVLLLFGAIG 
IAVNDFQNGI 
IWVAVDQPVK 
GPRSNPGAGR 
THCQKICEPL 



Seq ID NO: 201 DNA sequence 

Nucleic Acid Accession #: NM_000728.2 

Coding sequence: 112..495 



GTAATAAGAG 

GTCGACCGGC 

CGGAAGTTCT 

CAGGCGGCGC 

GAGGACGCGC 

GAG CTGAAG C 

AACACTGCCA 

GTGAAGAGCA 

GACCTTCAAG 

CATATCCTTA 

AAGGAGGCAC 

TGGAAGAAGA 

GAGAATAATT 

GGAAACTAAT 

GGTTATTTGG 

ACTGTACCAC 

GTATGTAGCA 

AGCATCTATT 

AAATTTTTGT 

TGGATGCAAG 

TTGCTTTTTC 

TCCAATTCAT 

TTGCCTAACT 

TATAGTTTTA 

TGAGAGGTGT 

TTTGTTAAAA 

CTGATCATAT 

ACCATTCTTT 

ACCAGATAAT 

CTAAAATATT 

TTCTGATGAG 

CATATTAATA 

GTTTTCTCTG 

ATATCTTGTT 

ATTTTTGTTT 

AAAAAAAAAA 



11 

I 

CGGGGTCTCC 

CGCTCGCGCT 

CCCCCTTCCT 

CATTCAGGTC 

GCCTCCTGCT 

AGGAGCAGGA 

CCTGTGTGAC 

ACTTCGTGCC 

CCTGAGCAGA 

TAAGAGATTC 

AAGCCAAGGA 

GCAGCCCTGC 

TCTGTTGTTT 

ACAATACATT 

AAAGTGTGTA 

TTCGCCTTCT 

GTATCTCATT 

TTACCATATG 

TGGCTTGCTT 

ATTGTTTTCA 

ATTTTCTTAG 

CTTTTTTTTT 

AAGGTCCCAA 

TATTTTATAT 

AGGTTGAAAT 

AGACTGTTAT 

TTGTGTGGGT 

TGCCAATGTC 

GTGGGTCTAC 

TTCTACATCT 

ATTTTTAATG 

AT AT TAAGTC 

TTTTTTTTTT 

AGATTTTTAA 

TTAATTGTTC 

AAAAAAAAAA 



21 
i 

GCGGGGAAGG 

GCCCTGAAAC 

GGCTCTCAGT 

TGCCCTGGAG 

GGCTGCACTG 

GACACAGGGC 

TCATCGGCTG 

CACCAATGTG 

TGAATGACTC 

ACTCAGAAGA 

AGTCTGTGTC 

TGACACCTAG 

TAAGCCACAA 

TTCATTTATT 

TTTAACTCTG 

TGCCAGCCAC 

GCTGTTTTAA 

TTTATCACCT 

GCTTTATTAG 

GATATATAGT 

CAGTGTCTCT 

CTTTTATGTA 

GGTCACAATA 

GTAGATTAGT 

T C AT ACCTGT 

TTCACCATTT 

ATATTTCTGG 

ATACTGCCTT 

CAACATTGTT 

TTTATACATT 

GGATTGTGTT 

GTTCAATTCA 

TTTAACAGTG 

CTATTTTATT 

ATTGCTAGTA 

AAAAAAAAAA 



31 



CGCCCACAGC 

TCTAGTCGCC 

ATCTTGGTCC 

AGCAGCCCAG 

GTGCAGGACT 

TCCAGCTCCG 

GCAGGCTTGC 

GGTT CCAAAG 

CAGGAAGAAG 

CACATGTGGA 

TACCAGAAGC 

AGTTTGGACT 

AGTTTGTGGT 

TTGGGTAAAT 

TAAGAAACTG 

ATATGAGAGC 

TTTGTATTTC 

TTATTGAAGG 

TGTTGAGTTT 

TTGGAAACTT 

CACAGAGAAA 

TTGTGCTTTT 

ACCTTATTCT 

GATCTATTTT 

GAATATAGAT 

AATTGCCCCT 

GTTCTCAATT 

GATTAGTGTA 

CATTCTTGTT 

TTAGAATCAG 

AAATCAGTGG 

TGAACACAAT 

TTCTCAGTTT 

TTTTGGTGCT 

GATAGAAATA 



41 
) 

AGGTGTGGTG 

AGAGAGGCGG 

TGTACCAGGC 

ACCCGGCCAC 

ATGTGCAGAT 

CTGCCCAGAA 

TGAGCAGATC 

CCTTTGGCAG 

GTGTGTCCTA 

GAAGGTGACA 

CAGAATCACA 

TCCAGCTTCC 

AATTTGTTAT 

GCCTTGGAGT 

CCAAACTATT 

TCTAGTATTT 

CCCAATGACT 

GTCTGTTTAA 

TTAGAGCTCT 

CCTTCCCCTG 

AAGTTGTAAT 

AGTTCATGTC 

ATACTTTCTT 

GAGTTAATTT 

ACCCAATTGT 

GCACCTTTGT 

CTGTCTCATT 

GTGTTAAAGT 

CAAAAAGATT 

TGTGTTACTA 

GTTAATTTTG 

ACATGTTTTC 

TCAACAGAAA 

AATGTAAATG 

CAATATTTAA 



51 
I 

TTCATCCCGG 

CATGGGTTTC 

GGGCAGCCTC 

ACTCAGTAAA 

GAAGGCCAGT 

GAGAGCCTGC 

AGGGGGCATG 

GCGCCGCAGG 

AATCCAATGA 

TGACAGAGGC 

GAACAGTCTC 

AGAACTGTGA 

GACAGCCCTA 

GGGATTGCTG 

TTCTGAAGTG 

CCACAAATAG 

AATGACGTTG 

ATCTTCTGCT 

TTATATGTTG 

AATCTGCGGA 

TTGAATAAGA 

TAAGAACTCT 

GTAAAAGTTT 

TTGTATAAGG 

TTCAGTGCCA 

CAAAAAGCAA 

GATTGATTTG 

GAAT CTCAAA 

TTAGCTACAT 

TCTACAAAAT 

GGAGAATTAG 

ACTTATTTAG 

TATTCTACAC 

GTACTTAAAC 

AATATTAGGA 



Seq ID NO: 202 Protein sequence: 
Protein Accession #: NP_000719.1 



11 



41 



51 



60 
120 
180 
240 
300 



60 
120 
180 
240 
300 
360 
42 0 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 



21 31 

1 1 I I I I 

MGFRKFSPFL ALSILVLYQA GSLQAAPFRS ALE S S PD PAT LSKEDARLLL AALVQDYVQM 
KASELKQEQE TQGSSSAAQK RACNTATCVT HRLAGLLSRS GGMVKSNFVP TNVGSKAFGR 
RRRDLQA 

Seq ID NO: 203 DNA sequence 
Nucleic Acid Accession #: NM_001741 
Coding sequence: 71..496 



60 
120 



CTCTGGCTGG 
GAGAGGTGTC 
GTTGCAGGCA 
AGACCCGGCC 
CTATGTGCAG 



11 
1 

ACGCCGCCGC 
ATGGGCTTCC 
GGCAGCCTCC 
ACGCT CAGTG 
ATGAAGGCCA 



21 

I 

CGCCGCTGCC 
AAAAGTTCTC 
ATGCAGCACC 
AGGACGAAGC 
GTGAGCTGGA 



31 



41 



ACCGCCTCTG 
CCCCTTCCTG 
ATTCAGGTCT 
GCGCCTCCTG 
GCAGGAGCAA 



ATCCAAGCCA 
GCTCTCAGCA 
GCCCTGGAGA 
CTGGCTGCAC 
GAGAGAGAGG 



51 
I 

CCTCCCGCCA 
TCTTGGTCCT 
GCAGCCCAGC 
TGGTGCAGGA 
GCTCCAGCCT 



60 
120 
180 
240 
300 



268 
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GGACAGCCCC AGATCTAAGC GGTGCGGTAA TCTGAGTACT TGCATGCTGG GCACATACAC 
GCAGGACTTC AACAAGTTTC ACACGTTCCC CCAAACTGCA ATTGGGGTTG GAGCACCTGG 
AAAGAAAAGG GATATGTCCA GCGACTTGGA GAGAGACCAT CGCCCTCATG TTAGCATGCC 
CCAGAATGCC AACTAAACTC CTCCCTTTCC TTCCTAATTT CCCTTCTTGC ATCCTTCCTA 
TAACTTGATG CATGTGGTTT GGTTCCTCTC TGGTGGCTCT TTGGGCTGGT ATTGGTGGCT 
TTCCTTGTGG CAGAGGATGT CTCAAACTTC AGATGGGAGG AAAGAGAGCA GGACT CACAG 
GT TGGAAGAG AATCACCTGG GAAAATACCA GAAAATGAGG GCCGCTTTGA GTCCCCCAGA 
GATGTCATCA GAGCTCCTCT GTCCTGCTTC TGAATGTGCT GATCATTTGA GGAATAAAAT 
TATTTTTCCC C 



Seq ID NO: 204 Protein sequence: 
Protein Accession #: NP_001732 

1 11 21 31 41 51 

I I I.I I I 

MGFQKFSPFL ALSILVLLQA GSLHAAPFRS ALESSPADPA TLSEDEARLL LAALVQDYVQ 

MKASELEQEQ EREGSSLDSP RSKRCGNLST CMLGTYTQDF NKFHTFPQTA IGVGAPGKKR 

DMSSDLERDH RPHVSMPQNA N 

Seq ID NO: 205 DNA sequence 
Nucleic Acid Accession #: NM_005361 
Coding sequence: 1-945 

1 11 21 31 41 51 

I I I I I I 

ATGCCT CTTG AGCAGAGGAG TCAGCACTGC AAGCCTGAAG AAGGCCTTGA GGCCCGAGGA 

GAGGCCCTGG GCCTGGTGGG TGCGCAGGCT CCTGCTACTG AGGAGCAGCA GACCGCTTCT 

TCCTCTTCTA CTCTAGTGGA AGTTACCCTG GGGGAGGTGC CTGCTGCCGA CTCACCGAGT 

CCTCCCCACA GTCCTCAGGG AGCCTCCAGC TTCTCGACTA CCATCAACTA CACTCTTTGG 

AGACAATCCG ATGAGGGCTC CAGCAACCAA GAAGAGGAGG GGCCAAGAAT GTTTCCCGAC 

CTGGAGTCCG AGTTCCAAGC AGCAATCAGT AGGAAGATGG TTGAGTTGGT TCATTTTCTG 

CTCCTCAAGT ATCGAGCCAG GGAGCCGGTC ACAAAGGCAG AAATGCTGGA GAGTGTCCTC 

AGAAATTGCC AGGACTTCTT TCCCGTGATC TTCAGCAAAG CCTCCGAGTA CTTGCAGCTG 

GTCTTTGGCA TCGAGGTGGT GG AAGTGGT C CCCATCAGCC ACTTGTACAT CCTTGTCACC 

TGCCTGGGCC TCTCCTACGA TGGCCTGCTG GGCGACAATC AGGTCATGCC CAAGACAGGC 

CTCCTGATAA TCGTCCTGGC CATAAT CGCA ATAGAGGGCG ACTGTGCCCC TGAGGAGAAA 

ATCTGGGAGG AG CTGAGTAT GTTGGAGGTG TTTGAGGGGA GGGAGGACAG TGTCTTCGCA 

CATCCCAGGA AGCTGCTCAT GCAAGATCTG GTGCAGGAAA ACTACCTGGA GTACCGGCAG 

GTGCCCGGCA GTGATCCTGC ATGCTACGAG TTCCTGTGGG GTCCAAGGGC CCTCATTGAA 

ACCAGCTATG TGAAAGTCCT GCACCATACA CTAAAGATCG GTGGAGAACC TCACATTTCC 

TACCCACCCC TGCATGAACG GGCTTTGAGA GAGGGAGAAG AGTGA 

Seq ID NO: 206 Protein sequence: 
Protein Accession #: NP_005352 

1 11 21 31 41 51 

1 I I I I I 

MPLEQRSQHC KPEEGLEARG EALGLVGAQA PATEEQQTAS SSSTLVEVTL GEVPAADSPS 

PPHSPQGASS FSTTINYTLW RQSDEGSSNQ EEEGPRMFPD LESEFQAAIS RKMVELVHFL 

LLKYRAREPV TKAEMLESVL RNCQDFFPVI FSKASEYLQL VFGIEVVEVV PISHLYILVT 

CLGLSYDGLL GDNQVMPKTG LLIIVLAIIA IEGDCAPEEK IWEELSMLEV FEGREDSVFA 

HPRKLLMQDL VQENYLEYRQ VPGSDPACYE FLWGPRALIE TSYVKVLHHT LKIGGEPHIS 

YPPLHERALR EGEE 

Seq ID NO: 207 DNA sequence 
Nucleic Acid Accession #: NM_021115 
Coding sequence: 743-2893 

1 11 21 31 41 51 

! I I 1 I I 

AAAGGAAGGG AGGGAGGGAG AAAGGAGAAG TTGGTTTAGA GGCCAGCCGG ACGAGCTTTG 
GGCACCGCCC TTAGGAGGGC CACCCTCAGA GTCTGACAGC AGGTGAAGGT CCTAAATCTC 
CCCAAACTAA CTGGTGTCTT TTCTCCTCTT CCAAGATGCT CTTCCCGAGG GAGATGCTAG 
CCCTTTGGGT CCTTACCTCC TGCCCTCAGG AGCCCCGGAG AGAGGCAGTC CTGGCAAAGA 
GCACCCTGAA GAGAGAGTGG TAACAGCGCC CCCCAGTTCC TCACAGTCGG CGGAAGTGCT 
GGGCGAGCTG GTGCTGGATG GGACCGCACC CTCTGCACAT CACGACATCC CAGCCCTGTC 
ACCGCTGCTT CCAGAGGAGG CCCGCCCCAA GCACGCCTTG CCCCCCAAGA AGAAACTGCC 
TTCGCTCAAG CAGGTGAACT CTGCCAGGAA GCAGCTGAGG CCCAAGGCCA CCTCCGCAGC 
CACTGTCCAA AGGGCAGGGT CCCAGCCAGC GTCCCAGGGC CTAGATCTCC TCTCCTCCTC 
CACGGAGAAG CCTGGCCCAC CGGGGGACCC GGACCCCATC GTGGCCTCCG AGGAGGCATC 
AGAAGTGCCC CTTTGGCTGG ACCGAAAGGA GAGTGCGGTC CCTACAACAC CCGCACCCCT 
GCAAATCTCC CCCTTCACTT CGCAGCCCTA TGTGGCCCAC ACACTCCCCC AGAGGCCAGA 
ACCCGGGGAG CCTGGGCCTG ACATGGCCCA GGAGGCCCCC CAGGAGGACA CCAGCCCCAT 
GGCCCTGATG GACAAAGGTG AGAATGAGCT GACTGGGTCA GCCTCAGAGG AGAGCCAGGA 
GACCACTACC TCCACCATTA TCACCACCAC GGTCATCACC ACCGAGCAGG CACCAGCTCT 
CTGCAGTGTG AGCTTCTCCA ATCCTGAGGG GTACATTGAC TCCAGCGACT ACCCACTGCT 
GCCCCTCAAC AACTTTCTGG AGTG CACAT A CAACGTGACA GTCTACACTG GCTATGGGGT 
GG AG C T C C AG GTGAAGAGTG TGAACCTGTC CGATGGGGAA CTGCTCTCCA TCCGCGGGGT 
GGACGGCCCT ACCCTGACCG TCCTGGCCAA CCAGACACTC CTGGTGGAGG GGCAGGTAAT 
CCGAAGCCCC ACCAACACCA TCTCCGTCTA CTTCCGGACC TTCCAGGACG ACGGCCTTGG 
GACCTTCCAG CTTCACTACC AGGCCTTCAT GCTGAGCTGC AACTTTCCCC GCCGGCCTGA 
CTCTGGGGAT GTCACGGTGA TGGACCTGCA CTCAGGTGGG GTGGCCCACT TTCACTGCCA 
CCTGGGCTAT GAGCTCCAGG GCGCTAAGAT GCTGACATGC ATCAATGCCT CCAAGCCGCA 
CTGGAGCAGC CAGGAGCCCA TCTGCTCAGC TCCTTGTGGA GGGGCAGTGC ACAATGCCAC 
CATCGGCCGC GTCCTCTCCC CAAGTTACCC TGAAAACACA AATGGGAGCC AATTCTGCAT 
CTGGACGATT GAAGCTCCAG AGGGCCAGAA GCTGCACCTG CACTTTGAGA GGCTGTTGCT 



269 



10 



15 



20 



25 



WO 02/086443 

GCATGACAAG GACAGGATGA 

CGACTCCCTT CAAACCGAGA 

CCGCATCGAG TTCACGTCCG 

AGCGTTTGAG AAAGGCCACT 

CGACCCGACC TATAACATTG 

GGAGCAGGGC CCGGCCATCA 

AGAGCCCCTG TGCAGAGCCA 

GTCCCCAAAC TGGCCCGAGC 

GGGAGAAGAG AAACGGATCT 

CTTGACCATC TACGATGGCG 

CAGTGGCCCC CAGAAACTGT 

CCCTGCTGGC CTCATCTTTG 

AAGGAATGAC TCCTGCTCGG 

CACGGAGTTG GTGCGGGGAG 

GGGGAGTGAC ACCCTCACCT 

TGAGAAAATT ATGTACTGCA 

GGATCCTGTG CTGCTGGTGG 

TGAAGGGAGT TCTCTTCTGA 

TCGCCTGCCC CACTGCGTTT 

GGCCCTGGCT AT CTT CAT CC 
TTACATCACA AGATGTCGCT 

CTACAGCCAG ATCACCGTGG 

CCAAAAGGTT TAGGGTTTCA 

AACCCCAATT TCCCCGAGAC 

AAAGGCGGCT GTTTTTTGGT 
TTTATAAATT TTAAAAGTG 



CGGTTCACAG 
GTGTCCCTTT 
ACCAGGCCCG 
GCTATGAGCC 
GGACTATAGT 
TCGAATGCAT 
TGTGTGGTGG 
CCTACGTGGA 
TCTTAGATAT 
ACGAGGT CAT 
ACTCCTCCAC 
GAAAGGGCCA 
ATTTACCCGA 
CCAGAATCAC 
GCCAGTGGGA 
CCGACCCCGG 
GGACCACCAT 
CCTGCTACAG 
CAGAAGCGGC 
CGGTCCTCAT 
ACTATTCCAA 
AAACCGAGTT 
TTTAAAAAGA 
ATTT AT CCAA 
TAAACTTTTT 



CGGGCAGACC 
TGAGGGCCTG 
GGCGGCCTCC 
CTACATCCAG 
GGAGTT CACC 
CAATGTGCGG 
GGAGCTCTCT 
AGGTGAAGAT 
CCAGTTCCTG 
GCCCCACATC 
GCCAGACTTA 
GGGATTTATC 
GAT CCAGAAT 
CTACCAGTGT 
CCTCAGCTGG 
AGAGGTGGAT 
CCAATACACC 
CCGTGAAACA 
AGCAGAGACG 
CATCTCCTTA 
CCTCCGCCTG 
TGACAACCCC 
GGTACCCTTT 
AGGCCCTGGG 
AACAAAGGGT 



AACAAGTCAG 
CTGAGCGAAG 
ACCTTCAACA 
AATGGGAACT 
TGCGACCCCG 
GACCCATACT 
GCTGTGGCTG 
TGTATCTGGA 
AATCTGAGCA 
TTGGGGCAGT 
ACCATCCAGT 
ATGAACTACA 
GGCTGGAAAA 
GACCCCGGCT 
AGCAGCGACC 
CACTCGACCC 
TGCAACCCCG 
GGGACTCCCA 
TCGCTGGAAG 
CTGCTGGGAG 
CCTCTGATGT 
ATTTACGAGA 
AAAAAGGGGC 
GGCCTTGATT 
TACGGGTTTT 



CTCTTCTCTA 1620 

G CAA CAC CAT 1680 

TCCGATTTGA 1740 

TCACTACATC 1800 

GCCACTCCCT 1860 

GGAAT GACAC 192 0 

GGGTGGT AT T 1980 

AGATCCACGT 2 040 

ACAGTGA CAT 2100 

ACCTTGGGAA 2160 

TCCATT CGGA 222 0 

TAGAGGTATC 22 8 0 

CCACTTCTCA 2340 

ATGACATCGT 2400 

CCCCATTTTG 2460 

GCTTAATTTC 252 0 

GTTTTGTGCT 2580 

TCTGGACGTC 2 640 

GGGGGAACAT 2700 

GAGCCTACAT 2760 

ACTCCCACCC 2 82 0 

CAGGGGGAAC 2 880 

TTGTGAACTC 2 940 

TAAACCCCCA 3000 

TTCCCCGGAT 3 060 



PCT/US02/12476 



Seq ID NO: 208 Protein sequence: 
Protein Accession #: NP_066938 



35 



40 



45 



MAQEAPQEDT 
PEGYIDSSDY 
LANQTLLVEG 
DLHSGGVAHF 
SYPENTNGSQ 
VPFEGLLSEG 
TIVEFTCDPG 
YVEGEDCIWK 
SSTPDLTIQF 
RITYQCDPGY 
TTIQYTCNPG 
VIiIISLLLGG 



11 
I 

SPMALMDKGE 
PLLPLNNFLE 
QVIRSPTNTI 
HCHLGYELQG 
FCIWTIEAPE 
NTIRIEFTSD 
HSIiEQGPAII 
IHVGEEKRIF 
HSDPAGLIFG 
D I VGSDTLTC 
FVLEGSSLLT 
AYIYITRCRY 



21 



31 



41 



51 



NELTGSASEE 
CTYNVTVYTG 
SVYFRTFQDD 
AKMLTCINAS 
GQKLHLHFER 
Q ARAASTFN I 
ECINVRDPYW 
LDIQFLNLSN 
KGQGFIMNYI 
QWDLSWSSDP 
CYSRETGTP I 
YSNLRLPLMY 



SQETTTSTII 
YGVELQVKSV 
GLGTFQLHYQ 
KPHWSSQEPI 
LLLHDKDRMT 
RFEAFEKGHC 
NDTEPLCRAM 
SDILTIYDGD 
EVSRNDSCSD 
PFCEKIMYCT 
WTSRLPHCVS 
SHPYSQITVE 



TTTVITTEQA 
NLSDGELLSI 
AFMLSCNFPR 
CSAPCGGAVH 
VHSGQTNKSA 
YEPYIQNGNF 
CGGELSAVAG 
EVMPHILGQY 
LPEIQNGWKT 
DPGEVDHSTR 
EAAAETSLEG 
TEFDNPIYET 



PALCSVSFSN 60 

RGVDGPTLTV 120 

RPDSGDVTVM 180 

NATIGRVLSP 240 

LLYDSLQTES 300 

TTSDPTYNIG 360 

WLSPNWPEP 42 0 

LGNSGPQKLY 480 

TSHTELVRGA 540 

LISDPVLLVG 600 

GNMALAIFIP 660 
GGTQKV 



50 



55 



60 



Seq ID NO: 209 DNA sequence 

Nucleic Acid Accession #: NM_001327.1 

Coding sequence: 89-631 



65 



AG CAGGGGGC 
CTGAGAGCCG 
GACGGGCGAT 
TGGCGGCCCA 
AAGGGCCTCG 
GCTGAATGGA 
CCTCGCCATG 
GGATG CCCCA 
CATACTGACT 
CTGTCTCCAG 
GGCTCAGCCT 
GCCTCCTCCC 
GTTTGTCGCT 



11 

I 

GCTGTGTGTA 
GGCAGAGGCT 
GCTGATGGCC 
GGAGAGGCGG 
GGGCCGGGAG 
TGCTGCAGAT 
CCTTTCGCGA 
CCGCTTCCCG 
ATCCGACTGA 
CAGCTTTCCC 
CCCTCAGGGC 
CTAGGGAATG 
GGAGGAGGAC 



21 

I 

CCGAGAATAC 
CCGGAGCCAT 
CAGGAGGCCC 
GTGCCACGGG 
GAGGCGCCCC 
GCGGGGCCAG 
CACCCATGGA 
TGCCAGGGGT 
CTGCTGCAGA 
TGTTGATGTG 
AGAGGCGCTA 
GTCCCAGCAC 
GGCTTACATG 



31 

I 

GAGAATACCT 
GCAGGCCGAA 
TGGCATTCCT 
CGGCAGAGGT 
GCGGGGTCCG 
GGGGCCGGAG 
AGCAGAGCTG 
GCTTCTGAAG 
CCACCGCCAA 
GAT CACGCAG 
AGCCCAGCCT 
GAGTGGCCAG 
TTTGTTTCTG 



41 
I 

CGTGGGCCCT 
GGCCGGGGCA 
GATGGCCCAG 
CCCCGGGGCG 
CATGGCGGCG 
AGCCGCCTGC 
GCCCGCAGGA 
GAGTTCACTG 
CTGCAGCTCT 
TGCTTTCTGC 
GGCGCCCCTT 
TTCATTGTGG 
TAGAAAATAA 



51 

I 

GACCTTCTCT 60 

CAGGGGGTTC 120 

GGGGCAATGC 180 

CAGGGGCAGC 240 

CGGCTTCAGG 300 

TTGAGTTCTA 360 

GCCTGGCCCA 420 

TGTCCGGCAA 4 80 

CCATCAGCTC 540 

CCGTGTTTTT 60 0 

CCTAGGTCAT 660 

GGGCCTGATT 72 0 
AACTGAGCTA 



70 



75 



Seq ID NO: 210 Protein sequence: 
Protein Accession #: NP_001318.1 



11 



21 31 41 51 

I 1 I I I I 

MQAEGRGTGG STGDADGPGG PG I PDGPGGN AGGPGEAGAT GGRGPRGAGA ARASGPGGGA 
PRGPHGGAAS GLNGCCRCGA RGPESR1.I.EF YL AMP FAT PM EAELARRSLA QDAPPLPVPG 
VLLKEFTVSG NILTIRLTAA DHRQLQLS I S SCLQQLSLLM WITQCFLPVF LAQPPSGQRR 



60 
120 



80 



85 



Seq ID NO: 211 DNA sequence 
Nucleic Acid Accession #: Eos 
Coding sequence: 52-459 



sequence 



CCTCGTGGGC 
GAAGGCCAGG 
CCTGATGGCC 
GGTCCCCGGG 
CCGCATGGCG 



11 

i 

CCTGACCTTC 
GCACAGGGGG 
CAGGGGGCAA 
GCGCAGGGGC 
GTGCCGCTTC 



21 
I 

TCTCTGAGAG 
TTCGACGGGC 
TGCTGGCGGC 
AGCAAGGGCC 
TGCGCAGGAT 



31 
I 

CCGGG CAG AG 
GATGCTGATG 
CCAGGAGAGG 
TCGGGGCCGA 
GGAAGGTGCC 



41 
I 

GCTCCGGAGC 
GCCCAGGAGG 
CGGGTGCCAC 
GAGGAGGCGC 
CCTGCGGGGC 



51 
I 

CATGCAGGCC 60 

CCCTGGCATT 120 

GGGCGGCAGA 180 

CCCGCGGGGT 240 

CAGGAGGCCG 300 



270 



WO 02/086443 

GACAGCCGCC TGCTTCAGTT 

ATCAGCTCCT GTCTCCAGCA 

GTGTTTTTGG CTCAGGCTCC 

TAGGTCATGC CTCCTCCCCT 

GCCTGATTGT TTGTCGCTGG 
CTGAGCTA 



PCT/US02/12476 



CCGACTGACT 
GCTTTCCCTG 
CTCAGGGCAG 
AGGGAATGGT 
AGGAGGACGG 



GCTGCAGACC 
TTGATGTGGA 
AGGCGCTAAG 
CCCAGCACGA 
CTTACATGTT 



ACCGCCAACT 
TCACGCAGTG 
CCCAGCCTGG 
GTGGCCAGTT 
TGTTTCTGTA 



GCAGCTCTCC 360 

CTTTCTGCCC 420 

CGCCCCTTCC 480 

CATTGTGGGG 540 

GAAAATAAAG 60 0 



10 



Seq ID NO: 212 Protein sequence: 
Protein Accession #: Eos sequence 
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41 

I I 1 I I 

MQAEGQGTGG STGDADGPGG PGIPDGPGGN AGGPGEAGAT GGRGPRGAGA ARASGPRGGA 

PRGPHGGAAS AQDGRCPCGA RRPDSRLLQF RLTAADHRQL QLSISSCLQQ LSLLMWITQC 

FLPVFLAQAP SGQRR 

Seq ID NO: 213 DNA sequence 
Nucleic Acid Accession #: NM_000555
Coding sequence: 416..1498



85 



CTTATTTTTT 
AG CACAAAG A 
TCTGGGGGGA 
ACTCCCCCTT 
AACCTTGGGT 
TACAACTGTT 
CCCGAAGTTC 
ACTTGATTTT 
GATGAATGGG 
CTTGCAGGCA 
CCGCTACTTC 
CTTGCTGGCT 
TTACATTTAC 
GGAAAGCTAT 
CAATCCCAAC 
GGCTAGCAGC 
TACCAT CAT C 
GACAGCCCAC 
CGGGGTTGTC 
CTTTGGTGAT 
TGATTTTTCT 
TGGCCCAAAG 
CCGAAGCAAG 
CAAGTCTAAG 
GGACCTGTAC 
GAGGGGAGAG 
TCTGCTCAAG 
TATTTTGAAA 
CACTGATCCA 
TCCAGGGATG 
TAAATTTGCC 
ATACAGCAAT 
ACAAACACAA 
GCAAGGCAGC 
CACCAATTCT 
TGCTTAGGAT 
ACATTTCCGA 
TTTGGAATCA 
TCTAGAAGGC 
TGTTCTATTG 
GGT CTGACAC 
CATGTCTGTA 
TTTTGTCTAA 
ATGTTATTTA 
AATAGCAGAG 
CATTAATAAT 
ATATTTTAAG 
CTTTCACTTG 
TAGTTTT CAG 
GCCCATAATG 
GCTTTNACCA 
CACAGCATCC 
CTAAATGGAA 
GTGTGTGTGT 
GTAATGGATT 
GTGGTGGTGG 
ACATTTTCGG 
ACCCCAAATG 
CCATTAATAA 
GTGCCTCCCA 
GGGCATAAAG 
CACCCATAGT 
TGGAGGCTGG 
ACACTAGCTC 
GGATATATTT 



11 

ATGAATGTCG 
CACTGGCTGT 
GGGGATGCAC 
CATAGTCATT 
AGCTCCTTCT 
AGTCATGTGG 
CAATTTGATA 
GGACACTTTG 
TTGCCTAGCC 
CTGAGTAATG 
AAGGGGATTG 
GACCTGACGC 
ACCATTGATG 
GTCTGTTCCT 
TGGTCTGTCA 
AACAGTGCAC 
CGCAGTGGGG 
TCTTTTGAGC 
AAAAAACTCT 
GATGATGTGT 
CTGGATGAAA 
GCATCCCCAA 
TCTCCAGCTG 
CAGTCTCCCA 
CTGCCTCTGT 
TGCTCAGAGT 
TGTCCAACAG 
AACACATTGT 
CAGTTACCAA 
CAAAATGTGC 
CCGTTTAAAT 
TAAAAAGTTT 
GTGCCCCTTT 
TCCCCAGCCT 
GGCTGTCAAT 
CCTGGTGCTG 
AGAGTTTATA 
ATAAGCAATT 
TGTCTAACAT 
AATGCCTTGT 
CTTTCAGTCT 
TTTCAGGAGC 
AAAACACATG 
GAAATTATGC 
GCCAATTCAA 
TTCAATGTGG 
CAACTCTTTT 
TCTTTAACAT 
TCTTTTGAGA 
GCAAAAACAA 
AATATAAAAA 
AAACCAAGCT 
TGAGCTTGCT 
GTGTGCATCT 
GGTGGCAACT 
GGTATCTCAA 
TTCAAGAAAA 
ATGAGGATCT 
GCCCATTTTA 
NAACATTTTG 
AATGGTGGGA 
NTCACTTTAG 
TAAAGAGCAG 
TNTGAGTATT 
T CTTTAGG AT 



21 



GATAGCTGCA 
TCCCTGGAGG 
ACATTAGAGT 
GTACTGAAAT 
GTTCTCTTCA 
GCATGTGTGA 
GGAGCCACTG 
ACGAAAGAGA 
CCACTCACAG 
AGAAGAAAGC 
TGTACGCTGT 
GATCTCTGTC 
GATCCAGGAA 
CAGACAACTT 
ACGTAAAAAC 
AGGCCAGGGA 
TGAAGCCTCG 
AAGTCCTCAC 
ACACTCTGGA 
TTATTGCCTG 
ATGAATGCCG 
CACCTCAGAA 
ACTCAGCAAA 
TCTCTACGCC 
CCTTGGATGA 
CCAGAGTACA 
GGCTATTGGT 
AATATGTTGG 
TTATGAGAGA 
TAGT CCATGA 
TTGCCCAAAC 
GTGTGGGGAA 
TCTCTGGATC 
CACTCTTCAC 
GGGGAGAAAT 
GGTTAGCTAA 
AAGCACAGTG 
GATAATAGTT 
ACCACATGAT 
TAACAG CCAA 
CTTTTTATAG 
AAACTCTTCA 
AAGAAAATTT 
TGT CACTGCC 
TAGAATCAGT 
ACCAGACATT 
TATCTATAAT 
TAGAAAGGAT 
TACAGGTTTA 
CTAATTTTAA 
TTCCCTTATT 
GCTGTTTGGC 
GTGTGTGTGT 
GCAGCTGCTT 
GGGTGGCACT 
ATGCCCCTAG 
GTGAGATGAT 
CTTTTTGCCC 
CTAANCCCCT 
TAGTTAATTG 
GGCCTGATTT 
GTCTCATTTA 
GACCAGAGGA 
TCCTTGATTG 
AACCTTTGAA 



31 
i 

CCAGCTTGGT 
CTGTCCCTTT 
AGGAAAGAGG 
GCAAAGACTG 
AGGGGAATTT 
GGAAACAGAT 
TCAGTCTCTG 
TAAGACATCC 
CGCCCACTGT 
CAAGAAGGTA 
GTCCTCTGAC 
TGACAACATC 
GATCGGAAGC 
CTTTAAAAAG 
ATCTGCCAAT 
GAACAAGGAC 
GAAGGCTGTG 
TGATATCACA 
TGGAAAACAG 
TGGTCCTGAA 
AGT CATGAAG 
GACTTCAGCC 
CGGAACCTCC 
CACCAGTCCT 
CTCGGACTCG 
AATCCAAGCC 
GCTTTCAAGT 
GTTTATTTTC 
TAGATTGATA 
CCTTTCAATG 
AGTTTTCCTT 
AAAAAAAACT 
TCAAGAATGG 
T CCTG AT TG A 
AAACCAACAA 
GAGAATAGAC 
AATTCCTGGT 
TGG AG TAAGG 
TACATGAACT 
CACTGAAAAC 
CAAGAAATCA 
GGCTCCTTTT 
ACCAGAAAAA 
AAACAGTAAC 
TTTTTGATAG 
CTAATTATAT 
CCTAATATTT 
TTCTCTTTAC 
TAACACTGCT 
TTGAAGGTCT 
CCTTGGTAAT 
TACTGAATGG 
GTGGTGGTGG 
CAAAATTAAG 
GCTGATGTGC 
ACAAGCTTCA 
GGTAGTACTG 
CCTCTCCTTT 
ATTTCTTTCT 
GGAAAAAGTG 
TAAAATTCAG 
GTCCATCACC 
AGAATCCAGA 
CGGT AT AT GT 
CCAACAATNT 



41 
I 

GGGGAAAGGG 
AAAGGAGAAT 
GCTTGGAATA 
CTTCCTAAGC 
TGTCAGGCTA 
GCCAGTTTTA 
AGGTTCCACC 
AGGAACATGC 
AGCTTCTACC 
CGTTTCTACC 
CGTTTTCGCA 
AACCTGCCTC 
ATGGATGAAC 
GTGGAGTACA 
ATGAAAG CCC 
TTTGTGCGCC 
CGTGTGCTTC 
GAAGCCATCA 
GTAACTTGTC 
AAATTTCGCT 
GGAAACCCAT 
AAGAGCCCTG 
AGCAGCCAGC 
GGCAGCCTCC 
CTTGGTGATT 
TATCATTGTA 
TTTTATTTTG 
CTGTGATTTC 
ACCATCCTTT 
GAAAGCTTAG 
TTGTAGAGGG 
CATTGGCAGA 
TGGAGGACCC 
GGCCCGGGTT 
CTTATAATTG 
AGAATTGGAA 
CAATCTCTCC 
GACTTCATAT 
GTATGGTATC 
ACTGTGAGAA 
ATATCCTTTT 
T T AT AAACTG 
AAAAAAAAAG 
CTCCAGGAGA 
CTTTTTAACA 
TTTAAATGAA 
CATACTGAAG 
TAAGGACTGA 
TTTTTTTTCC 
TGCTTGCCAN 
GGTGCAAATN 
CTTGCAGTTG 
TGGGAGGGGG 
AAATACTACA 
ACTGTGTAGG 
GATGTCTGTA 
GTTTCTGGTG 
TTTTGTAAAC 
AGAAGCTCAG 
ATACTTGGAT 
GCCAGAACCC 
TTTATTTTAA 
TTTCCTTATG 
ACTACTAGAA 
TCAATAACAA 



51 
I 

TTTGATGAAT 
CTTAGTTTAT 
AAATGAAAAC 
TGGAGATGCT 
TGGATTCATT 
ATGTATTTAG 
AAAATATGGA 
GAGGCTCCCG 
G AAC CAG AAC 
GCAATGGGGA 
GCTTTGACGC 
AGGGAGTGCG 
TGGAGGAAGG 
CCAAGAATGT 
CCCAGTCCTT 
CCAAGCTGGT 
TGAACAAGAA 
AACTGGAGAC 
TCCATGATTT 
ATGCTCAGGA 
CAGCCACAGC 
GTCCTATGCG 
TCTCTACCCC 
GG AAG CACAA 
CCATGTAAAG 
GTAGGGTACT 
TTGTTGTTGT 
TCCTCTGGGC 
GGGGCAGCAT 
GGGCCTGGGG 
GTGTTTAAAT 
TCCAAGAATG 
TGGAAGGACA 
TGTTGTCCAG 
TGACACCAGA 
AATACTGCAG 
ACTGAGGCAA 
ACCTGATTCC 
CATCTATCTC 
TTTGTTTTCA 
TATAAAAATT 
GTGATTTTTC 
CCGAAGAATA 
AAACAAGATG 
GTTATGCTTG 
ATGTTACAGC 
ACACAGAAAT 
TCATTTGAAA 
TGTAAACATA 
TCCTGTGTTG 
TTTGGAAAGG 
TTCCTCCACT 
TGGTGCATGT 
AGACACCCCT 
GGGGAACCCA 
GCTACCAAAA 
AAATTGAAAA 
CCATTCAAAA 
GGTTTNCTTA 
TAGGGGGTGT 
CCAATGACTC 
GTTGAGGAAG 
CTTGGGCCTC 
AATACCAAAT 
TAGTACATCT 



60 
12 0 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
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TCCATCTTAC 
AGGGGATGAG 
TTGTTTTAAA 
CCACCCCTGT 
TGTTAATTTT 
ACTTCTCCCT 
TTCCTACCTC 
ATGTATATAT 
AT TG AGAGAA 
GCTTTGTGTC 
GAAGGAACCT 
AGGAAACCGA 
GATTGGGTTT 
TATTGCCTTC 
ACATGCTGCT 
CCCTGCATTC 
ATTGAGGGCC 
TGCTCCATCG 
GAATGGAGGA 
CTTTCCAGGC 
ATANCTTTGT 
GGTACCATTC 
AACCTGGTCT 
GAGGACAATT 
TAAACATTGG 
CATCGTCTTG 
CAAACACATG 
TTCAGTTNTA 
CCTCCTTCTC 
TGAAGAAGGC 
GTGATTGGTG 
GGTACAATGC 
TCCATATCCC 
TGATGGGAAT 
CCAGATAGAA 
ATGGAAATAA 
AGGGCCACTT 
GCTTTAAGTC 
TGAGGCATGA 
TCCTAAAGCC 
CACCCANACT 
CCCGCTTTGG 
TTTTTTTTTG 
CTCGCTGCAA 
CGAGTAGCTG 
TTT TAGTAGA 
ATTATCTGCC 
GCTGACAAGA 
GGTGATTTTT 
TTAAGGCATC 
CAACAGAAGT 
TTAGGTCAAT 
TCTTTGACTT 
AGTCTCTCTT 
CTTATTATCT 
TTCTTAGCCT 
CTGGTCCTAC 
TTTCTTCTTC 
TATAGCTCAT 
CCTTTTTAGT 
GAGAAAAAAT 
GTG CCCATAA 
GTCATTTGTT 
ATTAAACTCT 
ACTGGTAGGC 
AAAGAGACAT 
CTTGACACCA 
TAAAGAAGCC 
TCACTGCTTG 
AT CC AAAAGG 
GTAATATATT 
TTTATTGAAT 
NTGTGCCATT 
AAAATGGAAA 
CAAAACAGCT 
TGGAGAGTAA 
GAATATATTC 
CCAGTTGTCT 
TCAGCAAACA 
AGTTATTGAT 
TCAGTGGTAA 
AAT CACATGT 
GATAGAGACC 
AAAAATGAGA 
AG CCAGAAAA 
ACCTAACCTA 
TGGTTTGCTG 



TTTTAATCGA 
GCTTGGCATA 
TTGGCCCACT 
CATTCACTTC 
TGCACGGTCT 
CTTTTTTACA 
CCTGATTTTT 
TGGGGCTGGG 
AAGCTCCTTT 
CTTATGGACT 
TAAGATCACA 
GACACAGAGG 
ACAACCCACA 
CATTAGGCTC 
GCCCTGATCT 
ACCTGGTTCC 
AATAGGAGCA 
TGAGGAGCCC 
AGATTGATTT 
TGAGGGAAAT 
TCATCCTAAC 
ACTGGCANGA 
CACTGTGGTT 
TCCAGGTATA 
CTCCTGTGTT 
TGTACACTGC 
GTTTTCCTTG 
AGAGACCTCC 
CTCCACAGTC 
AAGGAACCCT 
CTTACCTTGA 
TCCCAATCAC 
TAGGACAAGA 
GATCCCAANG 
NCACTGGGAC 
AAGGCATTGA 
GGATCCATTT 
CCAGACTGGT 
GAATGTTGCC 
TGGTCCCCAA 
CTTAGTGTTG 
CTTAGCTAGC 
ACTGAGTCTC 
CCTTCACCCT 
GGATTACAGG 
GATGGGGTTT 
CACCTCGGCC 
CTAATTTTTT 
TCTTACCTTG 
TTTCTGCTCC 
CACCTTGTAA 
AACCTTGAGG 
TTCTTTCTCT 
TCCACAGTAC 
TTATTTGTAC 
GTGATTTTGC 
CCCAGTCCAA 
TCCATTTTCA 
GTATCTTTAG 
CTGACATTTT 
CCACCCATGG 
TTTTTAAAGC 
TTGGCTGGAT 
CTATAATAAT 
AATCGGAGTT 
TTGCTTAATT 
ACTGTTCATG 
AGATTGTAGG 
GCAATACCAT 
GATTTGAACA 
GCAGCTTGAA 
TTTGCATTTC 
AAACTTGTAC 
CAGCCCACCC 
GTAATTGGTG 
ATGCATGGTA 
TTCTTTGTAG 
TACAGTTGTA 
ACAAACAAAC 
CATTTCTTAA 
ATTGGGGTTG 
AATCCAAAGA 
TCAGAAGACT 
GAAATAAAAC 
AAAAACAAGG 
CTCTGAAATT 
ACCCCACTTG 



GTATAAGGAA 
GTCCAAAATT 
TTCAAGGCAA 
CAATTTTACG 
ACACACATCA 
CACACACACA 
CTTCCCTACA 
CTGAACAACT 
TCTCTTCACT 
TTAGTATTAG 
TCATCTACTC 
TAAAGTAATT 
TCTCCTGGCT 
CTGAGAGTTA 
CAGTGGGAAA 
CATCCACATG 
ATGGGGTCCC 
TCTGAATAGC 
TCTCCATCAG 
GTTTCTTGTT 
TTTCTGAGAT 
TTTNTTTTAG 
GCCCTCATCC 
AGCAAGGGGC 
TGCACCAAAA 
TCCTGTGGCC 
CTGCAAGGCT 
TTCTGGGCTT 
ACAAGTAACC 
GAGATTCTTC 
ACAAAATTTT 
CCTGCACATT 
NAACAGGATG 
ATCACCCCAC 
AGTGGTTTGA 
TTTTTTAAAA 
CCAGGCCTTA 
CTCCCAAGTG 
CCATCTATCC 
AAATTGTTTT 
CGTCCTGCCT 
GTGACATTGG 
CCTCTGTCAC 
TCACCTCCCA 
CGTGCGCCAC 
CACCATGTTG 
TCCCAAAGTG 
ATCCCTTGGT 
GATGCCTGAG 
TGATCAGAAG 
GTAAGGCAAA 
GAATCAATGG 
GTCTAGTTTC 
AAACAT CCAT 
TTTTTCCTTC 
CTTGGGACTG 
TCAGAAGTAT 
TTCGTAATCC 
GTCTTTGCCT 
GTGGAGCAGT 
ATTTAT AT CA 
TGCAATATAA 
GGGGGTGGGG 
CTTGTTTGGG 
GATTTAAATG 
GACATGTATT 
ATACTGAATA 
TGTTAATTTA 
ATGGCATGCC 
AGTAAGAGGT 
GCCAATGATC 
CCACGTGTGG 
AGAAAATGTT 
TTTCTGCCCT 
GTTGTAGTGT 
TTGTACATCA 
TCCTTCTTCC 
AATATCTGAT 
CAAAATGTGG 
GGAACAGCAT 
TATTGGCCAT 
CAGTAGGTAG 
CTGCTTGACC 
AGATATTTAA 
GCATGAGTTC 
GTGATT CAAA 
GACTGGTAGG 



ATGTTTCTTT 

TAAGNCTCCA 

TTTTTTTTGT 

CAATCCAATT 

AGTCAGCAAG 

CACACACACA 

GAAATAGAAA 

AACTTCATAA 

GTTTTGGAAA 

CCTAGATTGA 

CTCTACTCCA 

TCCCCAAGGT 

CTTATTCCAG 

TTTCTCAGGG 

TNCACCCAGC 

GGTTGCAGAT 

TGGCCTTGTC 

CCCCCACTGA 

TTCACCTTGT 

TCCANAGTAN 

GGCTTTTCAA 

AATATGGGAG 

ACAATGTCCC 

TTTGTGACAA 

TAGCAAGCTG 

TTCCACAGCA 

NTTCCTGGGA 

ACCCCACTCC 

AAGGAACCTG 

TTTGAATCCT 

GTCTGTGTTC 

TGATTCTAAA 

CCTATATCCC 

CTCAGAAAAC 

ACGACTTCTT 

AAGATGATTG 

CTCATATATT 

AACCATAAGT 

CTTCAGGAAA 

TGTCTCCAAA 

TGTTTCCTTG 

CTATCATTTG 

CTAGGCTGGA 

GGTCGAAGCG 

CAAATCTGGC 

GCCAGACTGG 

CTGGGATTAC 

TTATTGGCTT 

ACTAGGGGAG 

GGCAGGTTAG 

GACTTTGAAG 

CTTTTTTGCC 

CTCTGTTCTC 

CCTTTCTCCT 

CTCCCTGTCT 

ATGATAAATT 

GTTGGTGGGG 

CCCTCAGCAG 

TCCAAGCACT 

GAAGCGTGCT 

GCTAAATACT 

TATAATGAGG 

GAGTAATTGC 

GCTTGCTAAC 

AAAAGATAAT 

TTTTCCTTCT 

GACAGTCCAT 

TTAAACAGAA 

AAAATTTACA 

TATGCCAAAA 

CCTTATGACT 

TAAGTCTTTA 

TTTATGGCCA 

ATAGCTGTAG 

TAGAGGTGTT 

CATTTCTTAA 

CACCCCCTTG 

TTGAGGCCCA 

GGAAAAGGCA 

TGTGATCAAA 

TGATTACATT 

TGATGTCCCT 

GATGACCAAT 

GAACTTTAGC 

AAATGCATTA 

AGCAGTATTT 

TTTGGTGAGG 



ATGGCCATTT 

ATAATTAATT 

GTGTCTGTAA 

TTAGCACTCA 

CATTTGCCAC 

CACAATCCAT 

TAGGGACAAA 

GTAGTATTAA 

GGATAGCCAT 

ATTATAGCGT 

AATTTCTCAT 

CACACAGCTG 

GGCCTTTTCC 

TCATGTTGCA 

AACCTAATAC 

GTCCTTGAAG 

CATCTGATTC 

ATGCTTGCCT 

GTCATCTCAT 

AAAAAAGAAA 

CATTTAAAAA 

TAAGATGAGG 

CAAAGCCATC 

AAATGTACCC 

TGTGCTCTAT 

GAAACCAGGG 

ACTAAGGGGG 

TCAGGTACTT 

AAAGTGGATG 

TTAGTCCAAG 

CTAATCCCTT 

TGGCTTTTAT 

C AAAATG AG C 

GTCTGTGCCA 

TTATGGTTGT 

GAACCTGTCT 

GCCTTCACTG 

GTTTTGGAGC 

AGGTGCCTTC 

AGTCTAGTAT 

TTAAGGATCT 

ACAAGACTAA 

GTGCAGTGGC 

ATTCTCCTGC 

TATTTTTTTA 

TCTTGAACTC 

AGGCATGAGC 

CAACATCTTC 

TATAGAATTC 

TTGGGAGAGG 

GCATTAGCGT 

GCTCTACCTC 

AGTTTATATT 

GTGCAATTCT 

AGGCATTGGG 

ATTTCCAGAT 

AATCAACCTG 

ATCTTTACAA 

GTACAGAATA 

CAGAGACATA 

AATAATTGAT 

GACCACAGGT 

TTAAAGTTTT 

TGTTGAGCTG 

TTAACAAATC 

GAGTCACCTA 

ATAAGAGAAA 

TTGCAAAGCC 

ATGACTTTTC 

TGTCTCCAAT 

TGTATACAAC 

AAATGTTTTT 

TTTTCAAAGG 

TTAGAATTGA 

AGCTTGCTAG 

CTCGTTTTAA 

CCCTCTCCCT 

ATAACTCTTG 

TTTCTCAACC 

GACTCAACTT 

CAGGATTGAA 

TATCCCTGCA 

AATTATTTGA 

CACCTATTTA 

CTATCAGTGT 

CAAGAGGCAT 

CCCCCATAAA 



TGGAGGGAGC 3960 

GCATTTTAAA 4020 

CTGAGCTCCT 40 80 

AGTT CCATTG 4140 

CACTCCCTAT 42 00 

CTCTTGCTTG 42 60 

GAAGGGGAAA 432 0 

CTAGGGGTAA 43 80 

TAGCATGACT 4440 

TTTTCTAGCT 4500 

TCTTCAGGCC 4560 

GCTGGGGCAG 4620 

CACTAAGTAG 4680 

TCTTGGAGCC 4740 

AGCCCCTTTT 4800 

AGAGTGAGGC 4860 

AGGAGATCAC 4 920 

TGCCCAAATG 4 980 

AATGGTTGGT 5040 

GAGTGGAACA 5100 

AAACTAGTGT 5160 

TAGAGAAAAT 522 0 

CTGCTNTGAT 5280 

TGG CTGATGT 5340 

ACACTCTTCC 540 0 

CAAAAGGGTC 5460 

TATTTATTAG 552 0 

CTCTCTCCTT 5580 

TGTAGCTATT 5640 

T C T TAG AC C A 570 0 

C AAT A CTNTG 5760 

TTTTTAAAAA 582 0 

TCCAGGACAC 5880 

ANAGACTT CC 5940 

CCAGTTTGCT 600 0 

TTGGCCACAT 6060 

AAGGGCTTTG 612 0 

TCATCTGGGG 6180 

CCTCCCTTTC 6240 

GGTCTTTATA 6300 

ATGCANACCT 63 60 

CTTTTTTTTT 6420 

ACAATCTTGG 6480 

CTCAGTCTCC 6540 

TTATTATTAT 6600 

TTGGCCTCAA 6660 

ACCATGCCCA 6720 

TGGAAT CAGA 6780 

CAATTGGTAA 6840 

TCAGATGGCA 6 90 0 

TTCTCATTAC 6 960 

TTTGTGTATC 7 02 0 

CTATGTTATC 7080 

GTCTCTCCCT 7140 

CATGTGCCTC 72 0 0 

T CAAT CAGCC 7260 

ATCCTGGCCC 732 0 

GCAGTTTCCT 73 80 

CTTTGTGGTT 7440 

ATCAGCTGAA 750 0 

TTTGTTTGAT 7560 

AATTTCTCCT 762 0 

ACCATTACAC 7 680 

TTTTAACTAA 7740 

TAT ACTAT AA 780 0 

AACATTTACT 7 860 

TTAGTGGACC 7 92 0 

CTTGGAAATG 7 980 

TTTATAAGTT 8 040 

GTATGGTCCT 810 0 

TAATGCATGT 8160 

GATCACCTTT 822 0 

GAGAAAGTTT 8280 

GTACCTGTAG 8340 

TGACTAGCTT 840 0 

CCTCTGAAAA 8460 

CTCCCTGCTC 852 0 

CCAAGTAAAG 8580 

ATCTCTCAGC 8640 

TACGTAAAAA 870 0 

TAG TTTTCAG 8760 

GCTGTTTTAA 882 0 

AAAAAAAAGA 8880 

GAATAGTTAT 8940 

CCTAGGCAAT 9000 

TCTCCTTTTT 9060 

CCAGCTGGAG 912 0 
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CAGACCCTTT TCATCTCCTG TGCCTGTAAC 
AATGAGGGCT TTCTTGGGTC AGAGGACTTC 
TAAGGTGCTG TGAACTGTGA GTGCTGAAGA 
AGCTGCTCTT GCAATTATTT TGGCTCTCAA 
TGTACATTTG CAAGATGTGT GTAATGTCAT 



Seq ID NO: 214 Protein sequence:
Protein Accession #: NP_000546



ACCCCTCTTC CCCCACCCCC TCCGCAATTC 
AAGGTTGTCT AGAGAAGTTT GCCATGTGTG 
TTCGCAGCAT TCAATACCAG GCAGCCAAAG 
GCTCTGTTCT TCATCGCATT CTCATTTCTG 
TTTCCAAAAA TAAAATTTGA TTTCAAT 



1 11 21 31 41 51 

I I I I I I 

MELDFGHFDE RDKTSRNMRG SRMNGLPSPT HSAHCSFYRT RTLQALSNEK KAKKVRFYRN 

GDRYFKGIVY AVSSDRFRSF DALLADLTRS LSDNINLPQG VRYIYTIDGS RKIGSMDELE 

EGESYVCSSD NFFKKVEYTK NVNPNWSVNV KTSANMKAPQ SLASSNSAQA RENKDFVRPK 

LVTIIRSGVK PRKAVRVLLN KKTAHSFEQV LTDITEAIKIi ETGWKKLYT LDGKQVTCLH 

DFFGDDDVFI ACGPEKFRYA QDDFSLDENE CRVMKGNP S A TAGPKASPTP QKTSAKSPGP 

MRRSKSPADS ANGTSSSQLS TPKSKQSPIS TPTSPGSLRK HKDLYLPLSL DDSDSLGDSM 



Seq ID NO: 215 DNA sequence 
Nucleic Acid Accession #: NM_130467 
Coding sequence: 312..644

1 11 21 31 41 51 

I I I I I I 

GGCACGAGGC AGAGCTCTGC AAGGAGAGGT TGTGTCTTCG TTCTTTCCGC CATCTTCGTT 

CTTTCCAACA TCTTCGTTCT TTCTCACTGA CCGAGACTCA GCCGGTAGGT CTGCAGAGTG 

GTCTTCCTGG TAATTTAGTT GTGAGTGAAT GTGTGGAGGA GCCAGCGGGC TTAGGACAGG 

TCCTGTGGCA CAGTCCGTGG CTTTGAGGGA AAAGGGCCTC GCGGTGGTCC TCCGCCTTCC 

CCCAGGTCGT GATGCAGGCG CCATGGGCCG GTAATCGTGG CTGGGCTGGA ACGAGGGAGG 

AAGTGAGAGA TATGAGTGAG CATGTAACAA GATCCCAATC CTCAGAAAGA GGAAATGACC 

AAGAGTCTTC CCAGCCAGTT GGACCTGTGA TTGTCCAGCA GCCCACTGAG GAAAAACGTC 

AAGAAGAGGA ACCACCAACT GATAATCAGG GTATTGCACC TAGTGGGGAG AT CAAAAATG 

AAGGAGCACC TGCTGTTCAA GGGACTGATG TGGAAGCTTT TCAACAGGAA CTGGCTCTGC 

TTAAGATAGA GGATGCACCT GGAGATGGT C CTGATGTCAG GGAGGGGACT CTGCCCACTT 

TTGATCCCAC TAAAGTGCTG GAAGCAGGTG AAGGGCAACT ATAGGTTTAA ACCAAGACAA 

ATGAAGACTG AAACCAAGAA TATTGTTCTT ATGCTGGAAA TTTGACTGCT AACATTCTCT 

TAATAAAGTT TTACAGTTTT CTGCAAAAAA AAAAAAAAAA AAA 



Seq ID NO: 216 Protein sequence:
Protein Accession #: NP_569734 

1 11 21 31 41 51 

I I 1 I I I 

MSEHVTRSQS SERGNDQESS QPVGPVIVQQ PTEEKRQEEE PPTDNQGIAP SGEIKNEGAP 

AVQGTDVEAF QQELALLKIE DAPGDGPDVR EGTIiPTFDPT KVLEAGEGQL 

Seq ID NO: 217 DNA sequence 

Nucleic Acid Accession #: NM_001476.1 

Coding sequence: 82..435

1 11 21 31 41 51 

I 1 1 I I I 

GCCAGGGAGC TGTGAGGCAG TGCTGTGTGG TTCCTGCCGT CCGGACTCTT TTTCCTCTAC 

TGAGATTCAT CTGTGTGAAA TATGAGT TGG CGAGGAAGAT CGACCTATTA TTGGCCTAGA 

CCAAGGCGCT ATGTACAGCC TCCTGAAGTG ATTGGGCCTA TGCGGCCCGA GCAGTTCAGT 

GATGAAGTGG AACCAGCAAC ACCTGAAGAA GGGGAACCAG CAACTCAACG TCAGGATCCT 

GCAGCTGCTC AGGAGGGAGA GGATGAGGGA GCATCTGCAG GTCAAGGGCC GAAGCCTGAA 

GCTGATAGCC AGGAACAGGG TCACCCACAG ACTGGGTGTG AGTGTGAAGA TGGTCCTGAT 

GGGCAGGAGG TGGACCCGCC AAATCCAGAG GAGGTGAAAA CGCCTGAAGA AGGTGAAAAG 

CAATCACAGT GTTAAAAGAA GACACGTTGA AATGATGCAG GCTGCTCCTA TGT TGGAAAT 

TTGTTCATTA AAATTCTCCC AATAAAGCTT TACAGCCTTC TGCAAAA 

Seq ID NO: 218 Protein sequence: 
Protein Accession #: NP_001467.1 

1 11 21 31 41 51 

I I I I I I 

MSWRGRSTYY WPRPRRYVQP PEVIGPMRPE QFSDEVEPAT PEEGEPATQR QDPAAAQEGE 

DEGASAGQGP KPEADSQEQG HPQTGCECED GPDGQEVDPP NPEEVKTPEE GEKQSQC 



Seq ID NO: 219 DNA sequence 
Nucleic Acid Accession #: NM_001476 
Coding sequence: 90-3671



1 11 21 31 41 51 

I 1 1 I i 1 

ACAGCGGAGC GCAGAGTGAG AACCACCAAC CGAGGCGCCG GGCAGCGACC CCTGCAGCGG 

AGACAGAGAC TGAGCGGCCC GGCACCGCCA TGCCTGCGCT CTGGCTGGGC TGCTGCCTCT 

GCTTCTCGCT CCTCCTGCCC GCAGCCCGGG CCACCTCCAG GAGGGAAGTC TGTGATTGCA 

ATGGGAAGTC CAGGCAGTGT ATCTTTGATC GGGAACTTCA CAGACAAACT GGTAATGGAT 

TCCGCTGCCT CAACTGCAAT GACAACACTG ATGGCATTCA CTGCGAGAAG TGCAAGAATG 

GCTTTTACCG GCACAGAGAA AGGGACCGCT GTTTGCCCTG CAATTGTAAC TCCAAAGGTT 
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CTCTTAGTGC TCGATGTGAC AACTCTGGAC GGTGCAGCTG TAAACCAGGT GTGACAGGAG 42 0 

CCAGATGCGA CCGATGTCTG CCAGGCTTCC ACATGCTCAC GGATGCGGGG TGCACCCAAG 480 

ACCAGAGACT GCTAGACTCC AAGTGTGACT GTGACCCAGC TGGCATCGCA GGGCCCTGTG 540 

ACGCGGGCCG CTGTGTCTGC AAGCCAGCTG TTACTGGAGA ACGCTGTGAT AGGTGTCGAT 600 

CAGGTTACTA TAATCTGGAT GGGGGGAACC CTGAGGGCTG TACCCAGTGT TTCTGCTATG 660 

GGCATTCAGC CAGCTGCCGC AGCTCTGCAG AATACAGTGT CCATAAGATC ACCTCTACCT 720 

TTCATCAAGA TGTTGATGGC TGGAAGGCTG TCCAACGAAA TGGGTCTCCT GCAAAGCTCC 780 

AATGGTCACA GCGCCATCAA GATGTGTTTA GCTCAGCCCA ACGACTAGAC CCTGT CTATT 840 

TTGTGGCTCC TGCCAAATTT CTTGGGAATC AACAGGTGAG CTATGGGCAA AGCCTGTCCT 900 

TTGACTACCG TGTGGACAGA GGAGGCAGAC ACCCATCTGC CCATGATGTG ATTCTGGAAG 960 

GTGCTGGTCT ACGGATCACA GCTCCCTTGA TGCCACTTGG CAAGACACTG CCTTGTGGGC 102 0 

TCACCAAGAC TTACACATTC AGGTTAAATG AGCATCCAAG CAATAATTGG AGCCCCCAGC 1080 

TGAGTTACTT TGAGT AT CGA AGGTTACTGC GGAATCTCAC AGCCCTCCGC ATCCGAG CTA 1140 

CATATGGAGA ATACAGTACT GGGTACATTG ACAATGTGAC CCTGATTTCA GCCCGCCCTG 12 0 0 

TCTCTGGAGC CCCAGCACCC TGGGTTGAAC AGTGTATATG TCCTGTTGGG TACAAGGGGC 12 60 

AATTCTGCCA GGATTGTGCT TCTGGCTACA AGAGAGATTC AGCGAGACTG GGGCCTTTTG 132 0 

GCACCTGTAT TCCTTGTAAC TGTCAAGGGG GAGGGGCCTG TGAT CCAGAC ACAGGAGATT 1380 

GTTATTCAGG GGATGAGAAT CCTGACATTG AGTGTGCTGA CTGCCCAATT GGTTTCTACA 1440 

ACGATCCGCA CGACCCCCGC AGCTGCAAGC CATGTCCCTG T CAT AACGGG TTCAGCTGCT 1500 

CAGTGATGCC GGAGACGGAG GAGGTGGTGT GCAATAACTG CCCTCCCGGG GTCACCGGTG 1560 

CCCGCTGTGA GCTCTGTGCT GATGGCTACT TTGGGGACCC CTTTGGTGAA CATGGCCCAG 162 0 

TGAGGCCTTG TCAGCCCTGT CAATGCAACA ACAATGTGGA CCCCAGTGCC TCTGGGAATT 1680 

GTGACCGGCT GACAGGCAGG TGTTTGAAGT GTATCCACAA CACAGCCGGC ATCTACTGCG 1740 

ACCAGTG CAA AGCAGGCTAC TTCGGGGACC CATTGGCTCC CAACCCAGCA GACAAGTGTC 1800 

GAGCTTGCAA CTGTAACCCC ATGGGCTCAG AGCCTGTAGG ATGTCGAAGT GATGGCACCT 1860 

GTGTTTGCAA GCCAGGATTT GGTGGCCCCA ACTGTGAGCA TGGAGCATTC AGCTGTCCAG 192 0 

CTTGCTATAA TCAAGTGAAG ATTCAGATGG AT C AGTTT AT GCAGCAGCTT CAGAGAATGG 1980 

AGGCCCTGAT TTCAAAGGCT CAGGGTGGTG ATGGAGTAGT ACCTGATACA GAGCTGGAAG 2 040 

GCAGGATGCA GCAGGCTGAG CAGGCCCTTC AGGACATTCT GAGAGATGCC CAGATTTCAG 210 0 

AAGGTGCTAG CAGATCCCTT GGTCTCCAGT TGGCCAAGGT GAGGAGCCAA GAGAACAGCT 2160 

ACCAGAGCCG CCTGGATGAC CTCAAGATGA CTGTGGAAAG AGTT CGGGCT CTGGGAAGTC 222 0 

AGTACCAGAA CCGAGTTCGG GATACTCACA GGCTCATCAC T CAGATGC AG CTGAGCCTGG 22 80 

CAGAAAGTGA AGCTTCCTTG GGAAACACTA ACATTCCTGC CTCAGACCAC TACGTGGGGC 2340 

CAAATGGCTT TAAAAGTCTG GCT CAGGAGG CCACAAGATT AGCAGAAAGC CACGTTGAGT 2400 

CAGCCAGTAA CATGGAGCAA CTGACAAGGG AAACTGAGGA CTATTCCAAA CAAGCCCTCT 2460 

CACTGGTGCG CAAGGCCCTG CATGAAGGAG TCGGAAGCGG AAGCGGTAGC CCGGACGGTG 2520 

CTGTGGTGCA AGGGCTTGTG GAAAAATTGG AGAAAACCAA GTCCCTGGCC CAGCAGTTGA 25 80 

CAAGGGAGGC CACTCAAGCG GAAATTGAAG CAGATAGGTC TTATCAGCAC AGTCTCCGCC 2 640 

TCCTGGATTC AGTGTCTCGG CTTCAGGGAG TCAGTGATCA GTCCTTTCAG GTGGAAGAAG 2700 

CAAAGAGGAT CAAACAAAAA GCGGATTCAC TCTCAACGCT GGTAACCAGG CATATGGATG 2760 

AGTTCAAGCG TACACAAAAG AATCTGGGAA ACTGGAAAGA AGAAGCACAG CAGCTCTTAC 2 820 

AGAATGGAAA AAGTG GGAG A GAGAAATCAG AT CAGCTGCT TTCCCGTGCC AATCTTGCTA 2880 

AAAGCAGAGC ACAAGAAGCA CTGAGTATGG GCAATGCCAC TTTTTATGAA GTTGAGAGCA 2 940 

TCCTTAAAAA C C T CAG AG AG TTTGACCTGC AGGTGGACAA CAGAAAAGCA GAAGCTGAAG 30 0 0 

AAGCCATGAA GAGACTCTCC TACATCAGCC AGAAGGTTTC AGATGCCAGT GACAAGACCC 30 60 

AGCAAGCAGA AAGAGCCCTG GGGAGCGCTG CTGCTGATGC ACAGAGGGCA AAGAATGGGG 312 0 

CCGGGGAGGC CCTGGAAATC TCCAGTGAGA TTGAACAGGA GATTGGGAGT CTGAACTTGG 3180 

AAGCCAATGT GACAGCAGAT GGAGCCTTGG CCATGGAAAA GGGACTGGCC TCTCTGAAGA 3240 

GTGAGATGAG GGAAGTGGAA GGAGAGCTGG AAAGGAAGGA GCTGGAGTTT GACACGAATA 3300 

TGGATGCAGT A C AG ATGGTG ATTACAGAAG CCCAGAAGGT TGATACCAGA GCCAAGAACG 3 3 60 

CTGGGGTTAC AATCCAAGAC ACACTCAACA CATTAGACGG CCTCCTGCAT CTGATGGACC 342 0 

AGCCTCTCAG TGTAGATGAA GAGGGGCTGG TCTTACTGGA GCAGAAGCTT TCCCGAGCCA 3480 

AGACCCAGAT CAACAGCCAA CTGCGGCCCA TGATGTCAGA GCTGGAAGAG AGGGCACGTC 3540 

AGCAGAGGGG CCACCTCCAT TTGCTGGAGA CAAGCATAGA TGGGATTCTG GCTGATGTGA 3 60 0 

AGAACT TGGA GAACATTAGG GACAACCTGC CCCCAGGCTG CTACAATACC CAGGCTCTTG 3 660 

AGCAACAGTG AAGCTGCCAT AAATATTTCT CAACTGAGGT TCTTGGGATA CAGATCTCAG 3 72 0 

GGCTCGGGAG CCATGTCATG TGAGTGGGTG GGATGGGGAC ATTTGAACAT GTTTAATGGG 3780 

TATGCTCAGG TCAACTGACC TGACCCCATT CCTGATCCCA TGGCCAGGTG GTTGTCTTAT 384 0 

TGCACCATAC TCCTTGCTTC CTGATGCTGG GCAATGAGGC AGATAGCACT GGGTGTGAGA 3 900 

ATGATCAAGG ATCTGGACCC CAAAGAATAG ACTGGATGGA AAGACAAACT GCACAGGCAG 3 960 

ATGTTTGCCT C ATAATAGT C GTAAGTGGAG TCCTGGAATT TGGACAAGTG CTGTTGGGAT 4020 

ATAGTCAACT TATTCTTTGA GTAATGTGAC TAAAGGAAAA AACTTTGACT TTGCCCAGGC 4080 

ATGAAAT TCT TCCTAATGTC AGAACAGAGT GCAACCCAGT CACACTGTGG CCAGTAAAAT 4140 

ACTATTGCCT CATATTGTCC TCTGCAAGCT TCTTGCTGAT CAGAGTTCCT CCTACTTACA 4200 

ACCCAGGGTG TGAACATGTT CTCCATTTTC AAGCTGGAAG AAGTGAGCAG TGTTGGAGTG 42 60 

AGGACCTGTA AGGCAGGCCC ATTCAGAGCT ATGGTGCTTG CTGGTGCCTG CCACCTTCAA 4320 

GTTCTGGACC TGGGCATGAC ATCCTTTCTT TTAATGATGC CATGGCAACT TAG AGAT TG C 43 80 

ATTTTTATTA AAGCATTTCC TACCAGCAAA GCAAATGTTG GGAAAGTATT TACTTTTTCG 4440 

GTTTCAAAGT GATAGAAAAG TGTGGCTTGG GCATTGAAAG AGGTAAAATT CTCTAGATTT 450 0 

ATTAGTCCTA ATTCAATCCT ACTTTTCGAA CACCAAAAAT GATGCGCATC AATGTATTTT 4560 

ATCTTATTTT CTCAATCTCC TCTCTCTTTC CTCCACCCAT AATAAGAGAA TGTTCCTACT 462 0 

CACACTTCAG CTGGGTCACA TCCATCCCTC CATTCATCCT TCCATCCATC TTTCCATCCA 4680 

TTACCTCCAT CCATCCTTCC AACATATATT TATTGAGTAC CTACTGTGTG CCAGGGGCTG 4740 

GTGGGACAGT GGTGACATAG TCTCTGCCCT CATAGAGTTG ATTGTCTAGT GAGGAAGACA 480 0 

AGCATTTTTA AAAAATAAAT TTAAACTTAC AAACTTTGTT TGTCACAAGT GGTGTTTATT 4860 

GCAATAACCG CTTGGTTTGC AACCTCTTTG CTCAACAGAA CATATGTTGC AAGACCCTCC 4 92 0 

CATGGGGGCA CTTGAGTTTT GGCAAGGCTG ACAGAGCTCT GGGTTGTGCA CATTTCTTTG 4 980 

CATTCCAGCT GTCACTCTGT GCCTTTCTAC AACTGATTGC AACAGACTGT TGAGTTATGA 5040 

TAACACCAGT GGGAATTGCT GGAGGAACCA GAGGCACTTC CACCTTGGCT GGGAAGACTA 5100 

TGGTGCTGCC TTGCTTCTGT ATTTCCTTGG ATTTTCCTGA AAGTGTTTTT AAATAAAGAA 5160 
CAATTGTTAG ATGCC 

Seq ID NO: 220 Protein sequence: 
Protein Accession #:NP_005553 

1 11 21 31 41 51 
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MPALWLGCCL CFSLLLPAAR 
DGIHCEKCKN GFYRHRERDR 
HMLTDAGCTQ DQRLLDSKCD 
PEGCTQCFCY GHSASCRSSA 
SSAQRLDPVY FVAPAKFLGN 
MPLGKTLPCG LTKTYTFRLN 
DNVTLISARP VSGAPAPWVE 
GGACDPDTGD CYSGDENPDI 
CNNCPPGVTG ARCELCADGY 
CIHNTAGIYC DQCKAGYFGD 
NCEHGAFSCP ACYNQVKIQM 
QDILRDAQIS EGASRSLGLQ 
RLITQMQLSL AESEASLGNT 
ETEDYSKQAL SLVRKALHEG 
ADRSYQHSLR LLDSVSRLQG 
NWKEEAQQLL QNGKSGREKS 
QVDNRKAEAE EAMKRLSYIS 
IEQEIGSLNL EANVTADGAL 
AQKVDTRAKN AGVTIQDTLN 
MMSELEERAR QQRGHLHLLE 



ATSRREVCDC NGKSRQCIFD 
CLPCNCNSKG SLSARCDNSG 
CDPAGIAGPC DAGRCVCKPA 
EYSVHKITST FHQDVDGWKA 
QQVSYGQSLS FDYRVDRGGR 
EHPSNNWSPQ LSYFEYRRLL 
QCICPVGYKG QFCQDCASGY 
ECADCPIGFY NDPHDPRSCK 
FGDPFGEHGP VRPCQPCQCN 
PLAPNPADKC RACNCNPMGS 
DQFMQQLQRM EALISKAQGG 
LAKVRSQENS YQSRLDDLKM 
NIPASDHYVG PNGFKSLAQE 
VGSGSGSPDG AWQGLVEKli 
VSDQSFQVEE AKRIKQKADS 
DQLLSRANLA KSRAQEALSM 
QKVSDASDKT QQAERALGSA 
AMEKGLASLK SEMREVEGEL 
TLDGLLHLMD QPLSVDEEGIi 
TSIDGILADV KNLENIRDNL 



RELHRQTGNG FRCLNCNDNT 
RCSCKPGVTG ARCDRCLPGF 
VTGERCDRCR SGYYNLDGGN 
VQRNGSPAKL QWSQRHQDVF 
HPSAHDVILE GAGIiRITAPL 
RNLTALRIRA TYGEYSTGY I 
KRDSARLGPF GTCIPCNCQG 
PCPCHNGFSC SVMPETEEW 
NNVDPSASGN CDRLTGRCLK 
EPVGCRSDGT CVCKPGFGGP 
DGWPDTEbE GRMQQAEQAL 
TVERVRALGS QYQNRVRDTH 
ATRLAESHVE SASNMEQLTR 
EKTKSLiAQQL TREATQAEIE 
LSTLVTRHMD EFKRTQKNLG 
GNATFYEVES ILKNLREFDL 
AADAQRAKNG AGEALEISSE 
ERKELEFDTN MDAVQMV I TE 
VLLEQKLSRA KTQINSQLRP 
PPGCYNTQAL EQQ 



Seq ID NO: 221 DNA sequence
Nucleic Acid Accession #: NM_016529
Coding sequence: 13-1854 

1 11 21 

1 1 1 

GTCAAGAAAA GAATGTCTGT AATTGTTCGA 

AAAGGGGCTG ATAATGTGAT TTTTGAGAGA 

ACATTATGCC ATCTGGAATA CTTTGCCACG 

GCTGATCTCT CTGAGAATGA GTATGAGGAG 

ATATTGAAGG ACAGAGCTCA ACGGTTGGAA 

CTGCTACTTG GAGCCACAGC CATAGAAGAT 

GCAACACTGT TGAAGGCAGA AATTAAAATA 

GCGATTAATA TAGGGTATTC CTGCCGATTG 

AAGGAGGACT CTTTGGATGC CACAAGGGCA 

AATTTGCTGG GCAAGGAAAA TGACGTGGCC 

GCGCTCTCCT TCGAAGT CCG GAGGAGTTTC 

ATATGCTGCA GAGTGTCTCC TCTG CAGAAG 

GTGAAGGCCA TCACCCTCGC CATCGGAGAC 

GCCCACGTGG GTGTGGGAAT CAGTGGGAAT 

TACGCCATCG CACAGTTTTC CTACTTAGAG 

TACAACCGGG TGACCAAGTG CATCTTGTAC 

ATTGAGCTTT GGTTCGCCTT TGTTAATGGA 

TGCATCGGCC TGTACAATGT GATTTTCACC 

GAGAGGTCTT GCACTCAGGA GAGCATGCTC 

AATGGCGAAG GCTTCAACAC AAAGGTTTTC 

TCCCTCATCC TCTTCTGGTT TCCCATGAAA 

GGTCATGCTA CCGACTATTT ATTTGTTGGA 

GTTTGTCTGA AAGCTGGTTT GGAGACCACA 

TGGGGAAGCA TGCTGACCTG GCTGGTGTTT 

ATTCCCATTG CTCCAGATAT GAGAGGACAG 

TGGTTGGGAT TATTTCTGGT TCCTACTGCC 

GCCAAGCACA CCTGCAAAAA GACATTGCTG 

CGAGTCCTGG GAAAAGCGGT GCTGCGGGAT 

CGCCTGATCA AGAGGCTGGG CCGGAAGACG 

CAGCAGGGCG TCCCGCATGG GTATGCTTTT 

GAAGAAGTCA TCCGTGCTTA TGACACCACC 

AATTTTCCTG ACTGATCTTA GGAAAGAGAT 

TTTGTCAGAG AAGACTGGCG TCCAAGGCCA 

AGTTAAGCAG TTTGTTAGTT ACATATTCCC 

AGCTATCTTT GCCCTCCCAA CTCGTCTGCA 

ATGAAGCATT CAACTGTGCT CTGTGAGGTC 

AGAAAAAAAA AAAAAAA 



9 



31 41 51 

1 I ) 

ACTCCTTCAG GACGACTTCG GCTTTACTGT 

CTTTCAAAAG ACTCAAAATA TATGGAGGAA 

GAAGGCTTGC GGACTCTCTG TGTGGCTTAT 

TGGCTGAAAG TCTATCAGGA AGCCAGCACC 

GAGTGTTACG AGAT CATTGA GAAGAATTTG 

CGCCTTCAAG CAGGAGTTCC AGAAACCATC 

TGGGTGTTGA CAGGAGACAA ACAAGAAACT 

GTATCGCAGA ATATGGCCCT TATCCTATTG 

GCCATTACTC AGCACTGCAC TGACCTTGGG 

C T CAT CAT CG ATGGCCACAC CCTGAAGTAC 

CTGGATTTGG CACTCTCGTG CAAAGCGGTC 

TCTGAGATAG TGGATGTGGT GAAGAAGCGG 

GGCGCCAACG ATGTCGGGAT GATCCAGACA 

GAAGGCATGC AGGCCACCAA CAACT CGGAT 

AAGCTTCTGT TGGTTCATGG AGCCTGGAGC 

TGCTTCTATA AGAACGTGGT CCTGTATATT 

TTTTCTGGGC AGATTTTATT TGAACGTTGG 

GCTTTGCCGC CCTTCACTCT GGGAATCTTT 

AGGTTTCCCC AGCTCTACAA AATCACCCAG 

TGGGGTCACT GCATCAACGC CTTGGTCCAC 

GCTCTGGAGC ATGATACTGT GTTTGACAGT 

AATATTGTTT ACACATATGT TGTTGTTACT 

GCTTGGACTA AATTCAGTCA TCTGGCTGTC 

TTTGGCATCT ACTCGACCAT CTGGCCCACC 

GCAACTATGG TCCTGAGCTC CGCACACTTC 

TGTTTGATTG AAGATGTGGC ATGGAGAGCA 

GAGGAGGTGC AGGAGCTGGA AACCAAGTCT 

AGCAATGGAA AGAGGCTGAA CGAGCGCGAC 

CCCCCGACGC TGTTCCGGGG CAGCTCCCTG 

TCT CAAGAAG AACACGGAGC TGT TAGTCAG 

AAAAAGAAAT CCAGGAAGAA ATAAGACATG 

TCAGTTTGTT GCACCCAGTG TTAACACATC 

AAACACCAGG AAACACATTT CTGTGGCCTT 

TCGCAAACCT GGAGTGCAGA CCACAGGGGA 

GTGCTTAGCC TAACTTTTGT TTATGTCGTT 

TCAAATTAAA AACATTATGT TTCACCAATA 



Seq ID NO: 222 Protein sequence: 
Protein Accession #: NP_057613



1 11 21 31 41 51 

I I I I I I 

MSVIVRTPSG RLRLYCKGAD NVIFERLSKD SKYMEETLCH LEYFATEGLR TLCVAYADLS 

ENEYEEWLKV YQEASTILKD RAQRLEECYE IIEKNLLLLG ATAIEDRLQA GVPET I ATLL 

KAEIKIWVLT GDKQETAINI GYSCRLVSQN MALILLKEDS LDATRAAITQ HCTDLGNLLG 

KENDVALI ID GHTLKYALSF EVRRSFLDLA LSCKAVICCR VSPLQKSEIV DWKKRVKAI 

TLAIGDGAND VGMIQTAHVG VGISGNEGMQ ATNNSDYA I A QFSYLEKIjLL VHGAWSYNRV 

TKCILYCFYK NWLYIIELW FAFVNGFSGQ ILFERWCIGL YNVIFTALPP FTLGIFERSC 

TQESMLRFPQ LYKITQNGEG FNTKVFWGHC INALVHSLIL FWFPMKALEH DTVFDSGHAT 

DYLFVGNIVY TYVWTVCLK AGLETTAWTK FSHLAVWGSM LTWLVFFGIY STIWPTIPIA 

PDMRGQATMV LSSAHFWLGL FLVPTACLIE DVAWRAAKHT CKKTLLEEVQ ELETKSRVLG 

KAVLRDSNGK RLNERDRLIK RLGRKTPPTL FRGSSLQQGV PHGYAFSQEE HGAVSQEEVI 

RAYDTTKKKS RKK 



Seq ID NO: 223 DNA sequence 
Nucleic Acid Accession #: BC017001 
Coding sequence: 1-394

1 11 21 31 41 51 
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I I I I I I 

AACGCTGGGC AGGGCCGGCG CGGGTCGGGG GGCGCCCGAG GGGCCCGGGC CGAGCGGCGG 60 

CGCGCAGGGC GGCAGCATCC ACTCGGGCCG CATCGCCGCG GTGCACAACG TGCCGCTGAG 120 

CGTGCTCATC CGGCCGCTGC CGTCCGTGTT GGACCCCGCC AAGGTGCAGA GCCTCGTGGA 180 

CACGAT CCGG GAGGACCCAG ACAGCGTGCC CCCCATCGAT GTCCTCTGGA TCAAAGGGGC 240 

CCAGGGAGGT GACTACTTCT ACTCCTTTGG GGGCTGCCAC CGCTACGCGG CCTACCAGCA 300 

ACTGCAGCGA GAGACCATCC CCGCCAAGCT TGTCCAGTCC ACTCTCTCAG ACCTAAGGGT 360 

GTACCTGGGA GCATCCACAC CAGACTTGCA GTAGCAGCCT CCTTGGCACC TGCTGCCACC 420 

TTCAAGAGCC CAGAAGACAC ACCTGGCCTC CAGCAGGCTG GGCCATGCAG AAGGGAT AG C 480 

AGGGGTGCAT TCTCTTTGCA CCTGGCGAGA GGGTCTGACT CTGGGCACCC CTCTCACCGG 540 

CTACAAGGCC TTGGACTCAC TGTACAGTGT GGGAGCCCCA GTTCCCACCT CTGTGACAAT 600 

AGGATCATGG CCTTACCCTT GAAGCATTAC CGAGAAGGAG AACAGAGATG GGCTTGAAGA 660 

GCCACGTGCT GCCGGCTCCA AATTCCCAAG GACAAGGATC CCTCTGCATT TTTGTCTATG 72 0 

TAACCTCTTA TATGGACTAC ATTCAGCTGC AAGGAAAGGA AAACCTTGAT TGCAGTGGTT 780 

TAAACAAACA GAAGATTGTT T T T C C AC AT A GCATGGATTC TGGAGATGGG TGGCTAATGG 840 

TATTGGTTCA ACAACTCCAC GGAGGTAGGG GTCACGTCTT GGATCCTTTT GCCTTAATCT 90 0 

CAGTGCTCGT TACTTCATGG TCCCAAGATG GCTGCTGTAT CCCCAAGAAT CATGTCTGCG 960 

TTCAAGGAAG GAGGGGTGGA GGAAGAGGAA GGGCCAAACT AGCTGGACCC GTCACCTTCT 102 0 

AT CAGAAAGT AAAACCTCGT CAGAAGT CTG TTTCCTGCTC TCTCCCTCTG CATATCTTCA 1080 

CTTAGATGCC CTTGGCCCGA GCCAGCTACC ATTGCACCTC TAGCTGCAAA CAAAGCTAAG 1140 

ACAGCAGGGA ACAGAATTGT CATGGCTGAA TAGACCAATC GTGTTCCATC TACTGAGACT 1200 

GGCACACTGC CTCCTGCAAT AAAACTGGGA TCCCATTACC AAGAGAGAAA TGCAGAATTG 1260 

TGTACCAGTT AGCTTTTGCT GTGTAACAAA CCATCCCCAA ACTTGGCAGC TAGAAACAAA 1320 

CCCTGTATTT TCCCACAATC CTATGGGTTG GCAATTTGGG CTGGGCTCAA CAGGGCAGTT 13 80 

CTGCTGCTCA CACCTGGGAT CCCT CATGGA GCTAAGGTCA GCTGTTACCT CAGCTGGGCC 1440 

TGGATGGTCT AGGATAGCCT TACTCACTTG CCTGGCAGGT GACAGGCTGT TGGCTGGAAT 150 0 

TGCTTGGTTC TCCTCCATGT GGCCTCTCCA GCAGGCTAGC TCAGGCTTAT TCACATGATG 1560 

GCTTCAGGAT TCCAAAGAGA GTGAGAGTAG AAGCTGAAAG ACTTCTTGAG TTCTTGGCCT 162 0 

GGAACTGGGA CTAGGACAGT GTCACTTCTG CTAAGTTCTT TTGGTCAGAG CAAATCACAA 168 0 

GGCTTTACCC AGATTCAAGG GATGAGAAAC AGACTACATG TCTTGATGAG GGGAACCACA 1740 

AAGAGCTTGT GGCCATTTTT CACCTATCAC AAATAATTTT GGATGGGTAT TTATTTGGAT 1800 

AAAGGTATTT CCCTCTTCCC CCTTTCTCTC TGTCTCATGG GGCCTCACTC TGCCAAGTTG 1860 

GAAGGCACTA AGACATTGTC CTGGCCCTCA GGGTCTAGGG GAAGAGGTGT TGGGGCAGGA 192 0 

AGTGAGTCTC TCCATGGGCT GGAGCCACTG TAGTAGGAGT GCCTCCTTGT CTGCACTGCT 1980 

GGTATGGGGT TAGGCCAGGT AGGACATTCC AGAGGGGCTT CTGAAAACCA AGAGTCCCTG 2040 

GGGAAAGGGA ACAGAGTAAG GCAGGCCTTG TTCTCACTGC CCTCTAAGGG AACTTGGTCA 2100 

CTCGGCACTT TTAAGCCTCA GTTTCTCCAG TTCAATAATA AGGACAAGAG CTTTTCCCAT 2160 

GCATTCTCTT TCCCCGGGAA AGTTGACTGA GGTGACCAGT AATAGAATTG AAAAGGGAGA 222 0 

GTGTCTTCAG TGCAATGTGG CATCCTGGAT TGGGTCTTGG AACAAAAACA GGACATTAGT 22 80 

GGGAAAATTG GAAAT CTGAA AAAAGTCTGA ATTTTAGTTA ATATACCAAT TTCAGTCTCT . 2340 

TGGTTTTGAC AGATGTACCA TGGTGATGTA AGATGTTGAC CTTGGGGTAG GCTGGGTGAA 240 0 

GGGTATACAG GAACTCTTTG TACTATCTCT GCAACT TCT C TGTAAATCTA GTATCATTCC 2460 
AAAATAAAAG TTTATTTAAT TTAAAAAAAA AAAAAAAAAA AA 



Seq ID NO: 224 Protein sequence: 
Protein Accession #: AAH17001.1 

1 11 21 31 41 51 

11)111 

TLGRAGAGRG APEGPGPSGG AQGGSIHSGR IAAVHNVPLS VLIRPLPSVL DPAKVQSLVD 60 
TIREDPDSVP PIDVLWIKGA QGGDYFYSFG GCHRYAAYQQ LQRETIPAKL VQSTLSDLRV 120 
YLGASTPDLQ 

Seq ID NO: 225 DNA sequence 
Nucleic Acid Accession #: NM_021048 
Coding sequence: 1..1110 



1 11 21 31 41 51 

I I 1 I ! 1 

ATGCCTCGAG CT CCAAAGCG TCAGCGCTGC ATGCCTGAAG AAGATCTTCA AT CCCAAAGT 60 

GAGACACAGG GCCTCGAGGG TGCACAGGCT CCCCTGGCTG TGGAGGAGGA TGCTTCATCA 12 0 

TCCACTTCCA CCAGCTCCTC TTTTCCATCC TCTTTTCCCT CCTCCTCCTC TTCCTCCTCC 180 

TCCTCCTGCT ATCCTCTAAT ACCAAGCACC CCAGAGGAGG TTTCTGCTGA TGATGAGACA 240 

CCAAATCCTC CCCAGAGTGC TCAGATAGCC TGCTCCTCCC CCTCGGTCGT TGCTTCCCTT 300 

CCATTAGATC AAT CTGATGA GGGCTCCAGC AGCCAAAAGG AGGAGAGTCC AAGCACCCTA 360 

CAGGTCCTGC CAGACAGTGA GTCTTTACCC AGAAGTGAGA TAGATGAAAA GGTGACTGAT 420 

TTGGTGCAGT TTCTGCTCTT CAAGTATCAA ATGAAGGAGC CG AT CACAAA GGCAGAAATA 480 

CTGGAGAGTG TCATAAAAAA TTATGAAGAC CACTTCCCTT TGTTGTTTAG TGAAGCCTCC 540 

GAGTGCATGC TGCTGGTCTT TGGCATTGAT GTAAAGGAAG TGGATCCCAC TGGCCACTCC 600 

TTTGTCCTTG TCACCTCCCT GGGCCTCACC TATGATGGGA TGCTGAGTGA TGTCCAGAGC 660 

ATGCCCAAGA CTGGCATTCT CATACTTATC CTAAGCATAA TCTTCATAGA GGGCTACTGC 720 

ACCCCTGAGG AGGTCATCTG GGAAGCACTG AATATGATGG GGCTGTATGA TGGGATGGAG 780 

CACCTCATTT ATGGGGAGCC CAGGAAGCTG CTCACCCAAG ATTGGGTGCA GGAAAACTAC 840 

CTGGAGTACC GGCAGGTGCC TGGCAGTGAT CCTGCACGGT ATGAGTTTCT GTGGGGTCCA 900 

AGGGCTCATG CTGAAATTAG GAAGATGAGT CTCCTGAAAT TTTTGGCCAA GGTAAATGGG 960 

AGTGATCCAA GATCCTTCCC ACTGTGGTAT GAGGAGGCTT TGAAAGATGA GGAAGAGAGA 102 0 

GCCCAGGACA GAATTGCCAC CACAGATGAT ACTACTGCCA TGGCCAGTGC AAGTTCTAGC 1080 
GCTACAGGTA GCTTCTCCTA CCCTGAATAA 

Seq ID NO: 226 Protein sequence:
Protein Accession #: NP_066386

1 11 21 31 41 51 

| j I i i I 

MPRAPKRQRC MPEEDLQSQS ETQGLEGAQA PLAVEEDASS STSTSSSFPS SFPSSSSSSS 60 



276 



WO 02/086443 

SSCYPLIPST PEEVSADDET 
QVLPDSESLP RSEIDEKVTD 
ECMLLVFGID VKEVDPTGHS 
TPEEVIWEAL NMMGLYDGME 
RAHAEIRKMS LLKFLAKVNG 
ATGSFSYPE 



PNPPQSAQIA 
LVQFLLFKYQ 
FVLVTSLGLT 
HLIYGEPRKL 
SDPRSFPLWY 



CSSPSVVASL
MKEPITKAEI 
YDGMLSDVQS 
LTQDWVQENY 
EEALKDEEER 



PLDQSDEGSS 
LESVIKNYED 
MPKTGILILI 
LEYRQVPGSD 
AQDRIATTDD 



SQKEESPSTL 
HFPLLFSEAS 
LSIIFIEGYC 
PARYEFLWGP 
TTAMASASSS 



Seq ID NO: 227 DNA sequence

Nucleic Acid Accession #: NM_005025.1 

Coding sequence: 82-1314 



GCGGAGCACA 
GAGGCTTGAA 
AGTATGGCTA 
TATAATCGTC 
GCTCTTGCAA 
CACTCAATGG 
TCAAACATGG 
GTGCAAAATG 
GCAGCAGTAA 
TGGGTGGAGA 
GCTGCCACTT 
TTTAGGCCTG 
ATTCCAATGA 
GAAGCTGGTG 
ATGCTGGTGC 
CAGCTGGTTG 
AGGTTCACAG 
GAAATTTTCA 
TCCAAAGCAA 
GTCTCAGGAA 
CATCCATTTT 
GTCATGCATC 
TTATTTGAAT 
TAGGATTTGT 
AATATATGTA 
TGTTATGTCA 



11 
I 

GTCCGCCGAG 
ACTGTTACAA 
CAGGGGCCAC 
TTAGAGCCAC 
TGGGAATGAT 
GATATGACAG 
TAACTGCTAA 
GATTT CATGT 
AT CATGTGGA 
ATAACACAAA 
ATCTGGCCCT 
AAAATACTAG 
TGTAT CAGCA 
GT AT CTACCA 
TGT CCAGACA 
AAGAATGGGC 
TGGAACAGGA 
TCAAAGATGC 
TTCACAAGTC 
TGATTGCAAT 
TCTTTCTTAT 
CTGAAACAAT 
AACAAGGAAA 
GTTTTACAGT 
AATTATAAGT 
TTGTGTTTGT 



21 
I 

CACAAGCTCC 
TATGGCTTTC 
TTTCCCTGAG 
TGGTGAAGAT 
GGAACTTGGG 
CCTAAAAAAT 
AGAGAGCCAA 
CAATGAGGAG 
CTTCAGTCAA 
CAATCTGGTG 
CATTAATGCT 
AACCTTTTCT 
AGGAGAATTT 
AGTCCTAGAA 
GGAAGTT CCT 
AAACTCTGTG 
AATTGATTTA 
AAATTTGACA 
CTTCCTAGAG 
TAGTAGGATG 
CAGAAACAGG 
GAACACAAGT 
ACAGTAACTA 
ATATCTTAAG 
AACTTGTCAA 
GTGCTGTTGT 



31 
I 

AGCATCCCGT 
CTTGGACTCT 
GAAGCCATTG 
GAAAATATTC 
GCCCAAGGAT 
GGTGAAGAAT 
TATGTGATGA 
TTTTTGCAAA 
AATGTAGCCG 
AAAGATTTGG 
GTCTATTTCA 
TTCACTAAAG 
TATTATGGGG 
ATACCATATG 
CTTGCTACTC 
AAGAAGCAAA 
AAAGATGTTT 
GGCCTCTCTG 
GTTAATGAAG 
GCTGTGCTGT 
AGAACTGGTA 
GGACATGATT 
AGCACATTAT 
ATAATATTTA 
GGAATGTTAT 
TTAAAATAAA 



41 
I 

CAGGGGTTGC 
TCTCTTTGCT 
CTGACTTGTC 
TCTTCTCTCC 
CTACCCAGAA 
TTTCTTTCTT 
AAATTGCCAA 
TGATGAAAAA 
TGGCCAACTA 
TATCCCCAAG 
AGGGGAACTG 
ATGATGAAAG 
AATTTAGTGA 
AAGGAGATGA 
TGGAGCCATT 
AAGTAGAAGT 
TGAAGGCTCT 
ATAATAAGGA 
AAGGCTCAGA 
ATCCTCAAGT 
CAATTCTATT 
TCGAAGAACT 
GTTTG CAACT 
AAATAGTTCC 
CAGTATTAAG 
AGTACCTATT 



51 
I 

AGGTGTGTGG 
GGTTCTGCAA 
AGTGAATATG 
ATTGAGTATT 
AGAAATCCGC 
GAAGGAGTTT 
TTCCTTGTTT 
ATATTTTAAT 
CAT CAATAAG 
GGATTTTGAT 
GAAGTCGCAG 
TGAAGTCCAA 
TGGCTCCAAT 
AAT AAG CAT G 
AG T CAAAG C A 
ATACCTGCCC 
TGGAATAACT 
GATTTTTCTT 
AGCTGCTGCT 
TATTGTCGAC 
CATGGGACGA 
TTAAGTTACT 
GGTATATATT 
AGATAAAAAC 
CTAATGGTCC 
GAACATGTG 



Seq ID NO: 228 Protein sequence: 
Protein Accession #: NP_005016.1



MAFLGLFSL.L 
ELGAQGSTQK 
NEEFLQMMKK 
INAVYFKGNW 
VLEIPYEGDE 
I DLKD VLKAL 
SRMAVLYPQV 



11 

I 

VLQ SMATG AT 
EIRHSMGYDS 
YFNAAVNHVD 
KSQFRPENTR 
ISMMLVLSRQ 
GITEIFIKDA 
IVDHPFFFLI 



21 
I 

FPEEAIADLS 
LKNGEEFSFL 
FSQNVAVANY 
TFSFTKDDES 
EVPLATLEPL 
NI/TGL SDNKE 
RNRRTGTILF 



31 
I 

VNMYNRLRAT 
KEFSNMVTAK 
INKWVENNTN 
EVQIPMMYQQ 
VKAQLVEEWA 
IFLSKAIHKS 
MGRVMHPETM 



41 

I 

GEDENILFSP 
ESQYVMKIAN 
NLVKDLVSPR 
GEFYYGEFSD 
NSVKKQKVEV 
FLEVNEEGSE 
NTSGHDFEEL 



51 
I 

LSIALAMGMM 
SLFVQNGFHV 
DFDAATYLAL 
GSNEAGGIYQ 
YLPRFTVEQE 
AAAVSGMIAI 



Seq ID NO: 229 DNA sequence 
Nucleic Acid Accession #: NM_003695 
Coding sequence: 12-398 



11 



21 



31 



41 



51 



CGACATCAGA 
CAGCCCTTAC 
TCTGCCCGGC 
AT CTGGTGAA 
TCAGCAGCGG 
ACAACGCTGC 
TGAGCCTCCT 
TCATGCCTTT 
GGGTGCCAGG 
CATGGAATGC 
ACAGAGGATG 
GATTTCACAC 
TAAATGATTT 



GATGAGGACA 
CCTGCGCTGC 
CAGCTCTCGC 
GAAGGACTGT 
CACCAGCTCC 
ACCCACCCGC 
GGCCGTCATC 
CCTTCCCTTT 
AGCCCCAGGC 
TGATGACTTG 
CAGCCCCCAG 
TCCTTCTGTT 
AAACC 



GCATTGCTGC 
CACGTGTGCA 
TTCTGCAAGA 
GCGGAGTCGT 
ACCCAGTGCT 
ACCGCCCTCG 
TTAGCCCCCA 
CTCTGGGGAT 
TGAGGGCTTC 
GAGCAGGCCC 
CTGCATGGAA 
TTGTTGCCGT 



TCCTTGCAGC 
CCAGCTCCAG 
CCACGAACAC 
GCACACCCAG 
GCCAGGAGGA 
CCCACAGTGC 
GCCTGTGACC 
TCCACACCTC 
CCCGAAAGTC 
CACAGACCCC 
GGTGGAGGAC 
TTATTTTGTA 



CCTGGCTGTG 
CAACTGCAAG 
AGTGGAGCCT 
CTACACCCTG 
CCTGTGCAAT 
CCTCAGCCTG 
TTCCCCCCAG 
TCTTCCCCAG 
TGGGACCAGG 
ACAGAGGATG 
AGAAGCCCTG 
CTCAAATCTC 



GCTACAGGGC 
CATTCTGTGG 
CTGAGGGGGA 
CAAGGCCAGG 
GAGAAGCTGC 
GGGCTGGCCC 
GGAAGGCCCC 
CCGGCAACGG 
TCCAGGTGGG 
AAGCCACCCC 
TGGATCCCCG 
TACATGGAGA 



Seq ID NO: 230 Protein sequence:
Protein Accession #: NP_003686



1 11 21 31 41 51 

I 1 I I I I 

MRTALLLLAA LAVATGPALT LRCHVCTSSS NCKHSVVCPA SSRFCKTTNT VEPLRGNLVK

KDCAESCTPS YTLQGQVSSG TSSTQCCQED LCNEKLHNAA PTRTALAHSA LSLGLALSLL 

AVILAPSL 



Seq ID NO: 231 DNA sequence 

Nucleic Acid Accession # : Eos sequence 

Coding sequence: 126-752 



277 



10 



15 



20 



25 



30 



35 



40 



45 



WO 02/086443 

i li 

! I 

CCGGGCAGGT GGCTCATGCT 
AGGGGCGCAG GAATTCTGAT 
AGAAGATGAA GGATAT CGAC 
GTGTGAGGGA GAGAACCAGC 
GGAGAACTCG ACCGTTGGAA 
TCTCTCTTGA TGCCTCCATG 
GAAAGTACCA TCATGGCTTG 
ACCCAGTGGA CAATGCTGGG 
CCCGTGTGGC CCACAAGAAG 
ACGAGTCTTC TGACGTGAAC 
AAGTTGGGCC AGACGCTGCT 
TCATCCTGTC CATCGTGTGC 
TTCAGGATGG CTGTATTCTG 
CAAGAGTTCA GCCTTCCTTT 
TTCACTGCAC CGCCATCTTA 
TGACTCAGTT CCACATTTTG 
ACCAGCAACC CGGCTGTATA 
AGGGAGGGGA GAGGTGGAAT 
TTATTTCCTG GGACTTGGCA 
TCTGGTATTA ATTTAATCTC 
GGAATT CAGC GTAGCTACCT 
AGCTCTGACT TACAGCTGCA 
GGCTTCACAT CAATTTTTTT 
GTGGTTTTTT GTTTTATTTT 
CAGAAGGATG CCACCAGTTT 
GGTAATTCCT CACAACTTAG 
TGGGGAGCTT TTCGTTTTGT 
TCCTAGAGAA TCTACTCCGT 
TGCTGTCAGC CTGATATACT 
TTCTACTGTG TGTCGTTAAA 
TGTATAACTC GACTCTGTAT 
GTGTTTGTGA GATGCTCTTT 



21 
I 

CGGGAGCGTG 
GTGAAACTAA 
ATAGGAAAAG 
ACTTCTGGGA 
TGCCAAGATG 
CATTCTCAGC 
AGTGCTCTGA 
CTTTTTTCCT 
GGGGAGCTCT 
TGCAGAAGAC 
TCCCTGCGAA 
CTGATGATCA 
CGGTCAGAAT 
GGAGACTGCT 
CTGAGTTGCT 
GATTGCATAC 
CAGTGGTGAC 
ACAGTAGTTC 
AAAATCTGAT 
AGGAAAAACA 
CCAGACCGTG 
GTCACCTTTG 
CTTCCTTTAG 
TGTCAAGATT 
TTCCTTGAGG 
TGCACCAGTA 
TTTGTTTTTA 
TGCAGAATCA 
ACTTTGGACT 
CAACCGTCGG 
GTTTCAATGT 
GAAGATGGTA 



31 
I 

GTTGAGCGGC 
CAGTCTGTGA 
AGTATATCAT 
CGCACAGAGA 
CCTTGGAAAC 
TCAGAATCCT 
AGCCCATCCG 
GTATGACTTT 
CAATGGAAGA 
TAGAGAGACT 
GGGTTGTGTG 
CGCAGCTGGC 
GAGAGAGTCA 
CCATCAGTGC 
TCACGTGAGG 
TGGAAAAGAA 
CCAAGCAATG 
TTGGAATCTG 
TGGTGGGGAT 
AGAAATTAAC 
GTGTCTGGCC 
CTATAAGGCA 
GGTGGGGGAT 
GATTTTTAGA 
CCTAGGATTT 
GCACCAGCCA 
ATTCTCTTTC 
TTGCAACCTC 
CTGGAAACAG 
AGACCAGATG 
ATGTTACTGC 
CTTTTATATT 



41 
I 

TGGCGCGGTT 
GCCCTGGAAC 
CCCCAGTCCT 
CCGTGAAGAT 
AGCAGCCCGA 
GGATGAGGAG 
GACTACTTCC 
TTCGTGGCTT 
CGTGTGGTCT 
GTGG CAAGAA 
GATCTTCTGC 
TGGCTTCAGT 
AGCTGGGCAG 
CGAGGTGTGT 
AAAAGGGGGC 
GCCAATCTTC 
GATATAAACC 
AAGTCTCCTA 
CTCCTAGGAC 
CCAGAGAGAG 
TCCATTTTTG 
CCTGGGTAGA 
TGGTTTGGCT 
TGCAAGGACT 
TTTATTCTGT 
TTTTGAG CAG 
CTTAGCAGCA 
AGGAGCCCTC 
ATATGGGTTC 
ACCTGTTAGA 
AATGCTTCAC 
T 



51 
I 

GTCCTGGAGC 
CTCCACTCAG 
GGGTATAGAA 
TCCAAGTTCA 
GCCGAGGGCC 
CATCCCAAGG 
AAACACCAGC 
TCTTCTCTGG 
CTGTCCAAGC 
GAGCTGAATG 
CGCACCAGGC 
GGACCAAATT 
AATCTCTCGC 
GGGAACAGGC 
TTTGGCCCTG 
TTGCTAGTAA 
TAAAAATCTG 
TTTGATCAGG 
CTAGTGGACA 
TCTGGGTTTT 
TCTGTCATTC 
AGGGTGGATG 
TTCTTTTGTT 
TGAAAAGACC 
CCCGAGCAGA 
AGTACCTCTT 
AGGTCTTTTT 
ACTGATTGAG 
TATTCT CTAT 
TGGCTAGTCC 
CTGCTGTACA 



PCT/US02/12476 



Seq ID NO: 232 Protein sequence:
Protein Accession #: Eos sequence



11 



31 



41 



51 



21 

i 1 I I I 

MKDIDIGKEY IIPSPGYRSV RERTSTSGTH RDREDSKFRR TRPLECQDAL ETAARAEGLS 

LDASMHSQLR ILDEEHPKGK YHHGLSALKP IRTTSKHQHP VDNAGLFSCM TFSWLSSLAR

VAHKKGELSM EDVWSLSKHE SSDVNCRRLE RLWQEELNEV GPDAASLRRV VWIFCRTRLI

LSIVCLMITQ LAGFSGPNFQ DGCILRSE 

Seq ID NO: 233 DNA sequence

Nucleic Acid Accession #: CAT cluster 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 



60 
120 
180 



50 



55 



60 



65 



70 



75 



80 



85 



TTTTAATGGT 
CACAACATGA 
TGTTTCTTAG 
TAGTAAACTT 
TTTGTTTCCA 
TGTTTGACTG 
TTGTTATGGT 
AAGCTATTTT 
TATATTATGG 
ATTAGCCTAC 
AATAGGTTAA 
AATTAAAGTA 
TATGAAAGCT 
TATATATTTT 
TATCCTGTAT 
TAGAAGACCC 
TTTTTTTTAG 
GATTCTGTTA 
TCCAGATAAA 
CTTAGGCTCT 
CCATAGTATC 
ACTATAATAG 
TATCAATGTT 
TACATAAAAA 
AAGTCATTAA 
AGAATCATCT 
GGAAGATGGA 
GAGTTGAAGA 
CTTTTAAAAC 
TATTCTTCTA 
AGCCCTTGTG 
CTGTTCAGGT 
TGAGATGGAG 
ATCATATGGA 
TTTTAATTCT 
CAATCCCCAA 
TTTCTGGAAT 



GCTCATATAT 
ATCACATAAT 
AT CGTAGTCA 
CTCTTTCATC 
AAGTCACAAT 
AAAGCAAAAC 
ATATCTTTTT 
AATCAT CAAG 
ATTAACCAGA 
TATAGTATTA 
AAAGTAGTTA 
CATTTTAAAT 
CTGGCTATCA 
TTAGTTCCTT 
TTTTTTTAAG 
ACTCTTACTA 
GTAGTTTAAA 
AGCAT CCAAA 
AGATGGAGAA 
CTCCATGTAT 
AAGTGGAGGG 
AAGTTTGAGT 
ATCCAATGAT 
GTGCTCATGT 
TAATTTAATA 
GAGGACTTTT 
GCCATGCTTG 
CCACTGCTCT 
TAGTAATGTA 
ATAACTAGCA 
TAAGATTATT 
GAGAAAACAT 
GAGGTGGGCA 
AGTTTGGAAA 
CACTGTCTCA 
GGGGCAGTGT 
TGCACCTACA 



21 
I 

ACTGTATTTT 
CATGATTTTT 
TTGAGAAGTC 
TTTGTGTTAG 
TGAATTATTC 
AACGTGACAG 
ATTAAATATT 
TATGGAAAAC 
ATTGTATCAT 
ATAAATTTTT 
CAAATTAAAC 
GAGCTTTATA 
TCCTGGGATA 
TGAGATAACT 
AATTGTTTTA 
GGTTCCCTAA 
GCAAGCACTG 
AACAATGCCT 
TACCTCATGT 
CTTTCTTAAG 
TAGTTCAGAA 
AATATTTTAA 
TTTTATTAAA 
ATTTGAATTT 
ATTGTTTTAA 
AATATGGAAT 
TTTTTCCAAA 
AAATTAGTGC 
CCCAGTTAAG 
TTTATTACAT 
ATTTCTTCTC 
AATGGATTTT 
CATTTAAGGT 
AGAGAGCTTA 
AAAGAGAATC 
TACCTTACTC 
TGTTTTCTTA 



31 



TTGTTGTTTA 
TTTTTTTACT 
CCAATAACTC 
CTCTGTAGTC 
TTAGATACCT 
TTTATTTTCA 
TATTTTGACT 
AAATTACTAT 
TTTTGGCCTA 
CAGTTGGTTT 
TTACTAATTT 
ATAC CTT AAA 
GTAATTTCTA 
AATTTCTAAT 
TAAATAGGTC 
GGATCTGCCA 
ATACCAGTGG 
AATTT CAGTT 
ACTGTGACTT 
GAAAAGTTTC 
AAGTTAATAG 
TAAATTTATA 
AAATTACCTT 
TAAATAATTT 
AT CAGTGGTT 
CCACCTCATA 
AGCTCTTTGA 
AGGAAAATGC 
TTTTGATGGT 
GAAATTTAAG 
TATAACTTCA 
TTTTTTTTTC 
CAGTTCACTA 
TCACAGGTTT 
AGCTCTCCAG 
CTTCACTGCT 
TTAACATTCA 



41 

I 

GTTTTACTTA 
TTTACTCCCC 
TAAACTTTTG 
TTAACCTGGA 
TAAGCCACTG 
AACACTAACT 
AAGCTTTCAT 
TGCATTTTCC 
ATGTCTGGAT 
GGGCAAATTT 
ATACCTGATT 
AAGTTGGTTC 
ATTATATAGT 
TATATATGTT 
ATAAGATACA 
TAGATTTTTT 
GAGTTGGTCT 
CTTAGGTTAT 
GAAAATGAAT 
TGAGTGTGAT 
GAAATCTTTT 
TAATTCAAAT 
ATTATTAGAA 
ATTTAAATCA 
TTCAACCCTC 
ACAATTAAGT 
GTGATTCTAA 
TTTTATTTCT 
TTAAATTCCA 
AGTTTAAGTT 
AAATAGATAT 
CTCTGGAGCT 
ACCTATGGTT 
GTATGCTGGT 
CAGTTCTAGA 
TCTTAGAAGG 
GAATTGGGAA 



51 
I 

TTGAGAGTGT 60 

AAATTATTCA 120 

AGTTATAACG 180 

TTTTAATTTT 240 

AATTCAGTTC 300 

TCT TGATATT 360 

AAAATATTTG 420 

TATATATGCA 480 

ATAAAAGATA 540 

AAACCTGAAA 600 

TTTTTTCTTG 660 

TAATTTAAAA 720 

ATTTCAAAAC 780 

TCAAAAACCA 840 

AGGTCTGCAT 900 

TTTTTTTTTT 960 

TGATCTAGGA 1020 

GGCTTGTGAC 1080 

TCTTAAAATT 1140 

CTCTCTTTTG 1200 

GTGACAGCAG 1260 

GATAAAAATG 1320 

CTGTGCCTAT 1380 

AGACCACCAT 1440 

ACTTCATATT 1500 

CTAAATTTCT 1560 

TTTGTAGTCA 1620 

CCCATGTTAA 1680 

CTAAAGAACA 1740 

CCATCAAACT 1800 

TTCATTCAAA 1860

GCCTGTTCAG 1920 

CAGAGTTCTG 1980 

GAATGGATAG 2040 

AAAGCTTTGA 210 0 

TAGAATTAAG 2160 

TATTAATTTT 2220 



278 



WO 02/086443 

TCCAGTGAGT AGTTTTCTGA AATTGGTAAC TTGGAGAGTA AAATAACGTA TTTTGCTTTT 22 80 

CAATTTTGTG TTTGTTTACT TTTATGTAAA AATTTGATAT GTGAATTACA CAGTTCTAAT 2340 

AAAACCTCAT GCCTTTTCAT TACATCTAAT TTGAACTCTC AACTTCAGTG CCAGAAGTGC 240 0 

TTTAAAGATG CTTTAATGAA AAGTATTAAG AAAATATATA GATTTGTATG TCAGTTTATA 2460 

CTT CAGAAAT CCATATATTT GTCATATTTA TTTTTTTAGA AACCTCCTAA TTGGATAACT 252 0 

AGATGGTATT TAAAATGAAT GCCCAAAAAT ATCTTGTACC TTTGTCCAAA AGTTTATCTG 2580 

TTGGAAGCCG CCAGCCATTC ATGTAGAGAG TTTATAAGAA AATAATTTAA AATTGTATGC 2 640 

ATTTTATATT ACTATGGTAT CTGTGTACCA TATTTCTAAG TATTCATTAT TAAATTGGTA 2700 

CTTCTTAAAA CCATAACCTG GCTTGCCTTT TAGTGTTAAA CACAAAATCC AACATTGTAT 2 760 

ATAGAGATTC TTCTTTTATG AAGAAGAGCT GACGTAATTT ATTACCAGTG CATCTGCACA 2 82 0 

AAGACATTAA CATAAGTCTC TGAGCAGTGA TACATTTTCA AACATGAAGA GTGACAACCA 2 880 

CCACATTAAA CAACCACGGC AACACTCAGA CTTGGCACTT TCCTACGAAT CCATCCTATA 2 940 

TGTGCCTGGT ATCGCCTCTG GCATAACTTA CACGAATCGT CCTCCCTACT TGTCTACGCT 3 000 

CCTTCAT CAA GCACTTGCCA ACACATTCAC CTCTAACTTG TACAACCTTA CCAACTCACC 3 060 

ACAACATCTG CAACTCTACC CTATCAACTG CCAACCTAAA GACCCCCAAC ACAACACAAC 312 0 

CCCCAAACAC AAAACCACTA AATCATAACC ACCACACACG CCACACACCA CACACCCACC 3180 

CACACAACCA ACACACCACG ACCAAACACC CCACCACAAA CAAGCTAACA ACCACAAACA . 3240 
GACAACACAT CACATACACT CACTACCCCC CCATACTCCC ACCCACCA 

Seq ID NO: 234 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 27-281 

1 11 21 31 41 51 

l l l l l I 

AGCAGGAGGA GAGCTGGCGG GAAGACATGC ACCCCTTGAA GACCCAGAGA GAGGCCGTCT 60 

GTCTACCGCG TAGCAGTTAC ATCAGACTGA GACACTTCCT GTTTACAGGA GACTATAAAA 120

TTCCTGCCCC GTGCTCATTT GGGGCTGACG CCATTTTAGG CCTCAGCCCA TCTGCACCCA 180 

GGCGCTCACT GAAACAGTGT GTTGCTCCAC ACCGCCTTGT TTTGCTTGTT GGCGCGCTCT 240 

CAGGGTTCCG ACCAATCCAA GAGCCTTGCA GAAAGCATTA ACGTGCTTTT CTCTTTGGCA 300 

GAGTTTTTCT TTGCTCTGAT CTTGGAGACA TCCCTCTGCC TAGTGGAAAC ATAAGGAATA 3 60 

CAGAAAGAAT GCAAGGAGAT AGACCAACGT GAGATTCTCC TTCATGCACT CAAGAGAAAG 42 0 

ATGTTGCAGG AAGAGCTAGT CTTTCAGGCT GGGCTGGTGA CCTGAGAAAG AATGTCCAGC 480 

TTTTCTTCTC CACTTGGCAT ATCAAGAGCC AGGCGTGGAA GACTAAAACA GGAAATGTTT 540 

ATAAAAACTG TTCAGCGGTT CGCCAACAAG AAGTGGTAAA GTAGCAAAAA TGGGGATGGA 600 

GATGCCAGGA GGAAAGATGC CAGGGGTAAA GTGGGAAAAT GGGAACCTGA AGCCAGGAGG 660 

TCAAGCCAAG CCAACAGGTG TTCTGTTTTT CAT CACAGAA CTAATAAGTG GTGCTGAGGA 720 

CTCAAACCCG GGGAAGCCCA CTCTAGAACC CATGCTGGTC ATCCATATCC CCAAGGCCCT 780 

GGTCAGAACA CAGCTAAGCA GATGGCTTGG GT CAT CAGGA CGTCCATTAC ATCCAAAGGA 840 

AG ACAG CCTG TGACGTTTCA AAAGCAAAAG TCCCCTACCA GCCAGTGAAG CTACCTGATT 900 

TCTCAGTATC TTACGCCCAG TGACACGATC TACCCTCAAA ACTTAAAAAA AAAAGGGAAA 960 

CATAAACACA TAACAGCAGC AGCAATAATT AAAGATGAGA TGAGAACAAT TAAGAAAAAA 1020 

GGAAAGGTCT CCTGTGACTG TTTTATTTTT AG GGAAACAG AGAGGAAGAA GAATGATTTT 1080 

TCTTTTGATG ACT CTATATC CAACTCTGAG GTTTGATTAA AGAAATGACC TTGAACCACA 1140 

GCAAAGAAAA ATAAAAGACA ATTTCCAGTA AGTATGCCAG TTCGAATTAA TGATTTACTT 1200 

TTTATTTTTA AACTGAATTC AGCAGAGATT TACATGCATT ACGATGATTA ACAT CTG AAA 12 60 

TTTGACCTTG AAATAATCTT TACATTGTAA ATTCTTAATG ATCAAAACAA GGTTCTCAGT 132 0 

GATTAAAACA TATTAGTAAT TAATTATTAA AGGAGAATAA TTGCAAATAC AACATTCCTA 1380 

AAATCTCAAG GCTTTTAAAG CATTTGTACA AATGACTGGA CATTTTTTAA ATTTGAAAAA 1440 

AAAAAAAAGC CCTCCATCTG ATTCTCATTT TCATTGTCAG TGCAACAACA AAAAAGGTAT 1500 

GCACTTCTCT TCTCATTTTC CACTGTCTCG CAAGCTAGAA ATT CTCACGA CTACCTTTGA 1560 

TCCCATCAAA GCCAAAGAAA GAAAAGAAAA TTGTTCTGTA CAGATATATG ACATTAAAAA 1620 
ATAATCCC 



Seq ID NO: 235 Protein sequence: 
Protein Accession #: Eos sequence 

1 11 21 31 41 51 

I I l l I I 

MHPLKTQREA VCLPRSSYIR LRHFLFTGDY KIPAPCSFGA DAILGLSPSA PRRSLKQCVA 60 
PHRLVLLVGA LSGFRPIQEP CRKH 

Seq ID NO: 236 DNA sequence 

Nucleic Acid Accession #: NM_002075 

Coding sequence: 406..1428

1 11 21 31 41 51 

I I I I 1 I 

CCACAATAGG GGCAGACCTG TCCATCCTTC TCTGTGGGTC CCCTGTACCT TTCTCCCCCA 60 

AC AGGAT CAG ACCCAGAGGC AGCTGGTTGG GGTTTGTCGA GAAGAAGGAT TATCCAGATC 120 

AGTCCTTTCT AATCTCAGCT CCTGCCTGTA CCCTCCCATA CTCACCAAAC CCTCTTCCCC 180 

ACCACCCTGA GCTGAGGAGC ACAGTTTGAG GCCCCCCCAA CCCCCCGCCG GTCGGGGCCA 240 

GGCCAGGCCA GGCCAGCTCC TCTGGCAGCA GAGCCTGGGC AGGTGACGGG CGGGCGCGGG 300 

CGTCGCAGCT GAGGGAGTAA GGAGGCTCCC AGGAACCGGA GCTGGAAACC CGGCCGAGGT 360 

CCAGCCAGAG CCCAAGAGCC AGAGTGACCC CTCGACCTGT CAGCCATGGG GGAGATGGAG 420 

CAACTGCGTC AGGAAGCGGA GCAGCTCAAG AAGCAGATTG CAGATGCCAG GAAAGCCTGT 480 

GCTGACGTTA CTCTGGCAGA GCTGGTGTCT GGCCTAGAGG TGGTGGGACG AGT CCAGATG 540 

CGGACGCGGC GGACGTTAAG GGGACACCTG GCCAAGATTT ACGCCATGCA CTGGGCCACT 600 

GATTCTAAGC TGCTGGTAAG TGCCTCGCAA GATGGGAAGC TGATCGTGTG GGACAGCTAC 660 

ACCACCAACA AGGTGCACGC CATCCCACTG CGCTCCTCCT GGGTCATGAC CTGTGCCTAT 720 

GCCCCATCAG GGAACTTTGT GGCATGTGGG GGGCTGGACA ACATGTGTTC CATCTACAAC 780 

CTCAAATCCC GTGAGGGCAA TGTCAAGGTC AGCCGGGAGC TTTCTGCTCA CACAGGTTAT 840 

CTCTCCTGCT GCCGCTTCCT GGATGACAAC AATATTGTGA CCAGCTCGGG GGACACCACG 900 

TGTGCCTTGT GGGACATTGA GACTGGGCAG CAGAAGACTG TATTTGTGGG ACACACGGGT 960 

GACTGCATGA GCCTGGCTGT GTCTCCTGAC TTCAATCTCT TCATTTCGGG GGCCTGTGAT 1020 

GCCAGTGCCA AGCT CTGGGA TGTGCGAGAG GGGACCTGCC GTCAGACTTT CACTGGCCAC 1080 



279 



WO 02/086443 

GAGTCGGACA TCAACGCCAT CTGTTTCTTC 
GATGACGCTT CCTGCCGCTT GTTTGACCTG 
CACGAGAGCA TCATCTGCGG CATCACGTCC 
TTCGCTGGCT ACGACGACTT CAACTGCAAT 
GGCATCCTCT CTGGCCACGA TAACAGGGTG 
GCTGTGGCCA CAGGTTCCTG GGACAGCTTC 
AAGGGAAGTG GAAGGCAGTG AACACACTCA 
GGTGTTCTCT TCTATATTCC GGGTGCCATT 
GGGAGCATGG GACTGTGCCT TTGGGAGGCA 
CCATCTCCTC CCATGGCCTT CCCTCCCCAC 
GGACAACCTG CCCCTCCCCA GCCCTTTGCA 
GCCCTAGGAT TCCTCCCCCA GAGCCACTAC 
TTGGCCCTGT GACTATGGCT CTGGCACCAC 
TTCTCCTTTT TCTACCTTTT TTTCTCTCCT 
GT 



CCCAATGGAG AGGCCATCTG CACGGGCTCG 1140 

CGGGCAGACC AGGAGCTGAT CTGCTTCTCC 120 0 

GTGGCCTTCT CCCTCAGTGG CCGCCTACTA 1260 

GTCTGGGACT CCATGAAGTC TGAGCGTGTG 132 0 

AGCTGCCTGG GAGTCACAGC TGACGGGATG 1380 

CTCAAAATCT GGAACTGAGG AGGCTGGAGA 1440 

GCAGCCCCCT GCCCGACCCC ATCTCATTCA 1500 

CCCACTAAGC TTTCTCCTTT GAGGGCAGTG 1560 

GCATCAGGGA CACAGGGGCA AAGAACTGCC 162 0 

AGTCCTCACA GCCTCTCCCT TAATGAGCAA 1680 

GGCCCAGCAG ACTTGAGTCT GAGGCCCCAG 1740 

CTTTGTCCAG GCCTGGGTGG TATAGGGCGT 1800 

TAGGGTCCTG GCCCTCTTCT TATTCATGCT 18 60 

AAGACACCTG CAATAAAGTG TAGCACCCTG 192 0 



Seq ID NO: 237 Protein sequence: 
Protein Accession #: NP_002066 

1 11 21 31 41 51 

( | I I 1 I 

MGEMEQLRQE AEQLKKQIAD ARKACADVTL AELVSGLEVV GRVQMRTRRT LRGHLAKIYA 60
MHWATDSKLL VSASQDGKLI VWDSYTTNKV HAIPLRSSWV MTCAYAPSGN FVACGGLDNM 120
CSIYNLKSRE GNVKVSRELS AHTGYLSCCR FLDDNNIVTS SGDTTCALWD IETGQQKTVF 180 
VGHTGDCMSL AVSPDFNLFI SGACDASAKL WDVREGTCRQ TFTGHESDIN AICFFPNGEA 240 
ICTGSDDASC RLFDLRADQE LICFSHESII CGITSVAFSL SGRLLFAGYD DFNCNVWDSM 300
KSERVGILSG HDNRVSCLGV TADGMAVATG SWDSFLKIWN



Seq ID NO: 238 DNA sequence 

Nucleic Acid Accession #: CAT cluster 



1 11 21 31 41 51 

I I I I I I 

TCCCAATGTG TNGAACCTAC CATAAATTCT TTTCTTACNG GACAATCTTA TNCTAANCAA 60 

TACCATTTGC TTTTAAGGCA GATAATCCTC CAAGTTTTCT AATGATATCT GAAACTAT T A 120 

ACTGATTCTG TGAATTATGA AATCTGAAAA GGAATTGGAA GTTGCTAAAA ATCTATCATT 180 

TGCATTGACC AGTGTGAAGC ACAGTGGAAT GAGAATGCGT GCCCTGACAC CAAAGAAAAA 240 

TAAGTGACTG GAAAGCTGAA GAATCACCGG CTTCAGTGAC ATGGAACCCA GTGATTTGAT 3 00 

TTTTGACGAG TAT CGGGTG A CTTTGAGGTG GT CAAGAAAC CACACTTTAA GAACAATGTC 3 60 

CAAAAAGGGG AAAAAAAAGA GCAACCAAAG AAAAAAAATC CAT AAAAT T G CACAGAAGAA 42 0 

AAGAAAGAAA AATAAAATAC ACAATATGGA CGATGGAGAA AAACAGTTAC ATTTCTTTAT 480 

GGATCAAGAA GTTTGTGTAC ACATAATCTC ATTTTGAGAT ATATAACTAT TTTTGTCTTT 540 

CAGAAGTGAA T CAAAAT ATT TCAAAATGCT GT CTTATGAA ACTACAATAT TC T CAC AG AT 600 

TAGAAAAGTT TTTCTGTAAA AGTCAGATAG TAAATATTTT AGGTTTTGCA GTGTCTTTTG 660 

CAACTACTCA ACTTTCCTAC TGTAGCACAA GAGTAGCTGT GGTACTGTGC AAATAAATTG 72 0 

CTTGTGTTCC AATAAAGCTT CATTTACAAA AACATGCCAT GGGCCATATT TGGCCTGTAC 7 80 

ACTGTTGTTT GCCAAGTCCT AATATAGTTG CTTAGCAAGT ATTGTGAGCT AT T T GAG G AA 840 

GACATGAAAG TTCATTGGGT TGCTAAAAAG TATGTAGAAA TTCAAAGGAA AATTAAAATT 900 

TAGGCTAAGT TATAATACAC TGTTTTAACA ATTGTAAAAT GTAAGAGAAA TTTACAAATA 960 
AAAATCCCAA ATAAAA 



Seq ID NO: 239 DNA sequence 

Nucleic Acid Accession #: NM_001786.1

Coding sequence: 130-1023 

1 11 21 31 41 51

! | I I I I 

GGGGGGGGGG GGCACTTGGC TTCAAAGCTG GCTCTTGGAA ATTGAGCGGA GAGCGACGCG 60 

GTTGTTGTAG CTGCCGCTGC GGCCGCCGCG GAATAATAAG CCGGGATCTA CCATACCCAT 120 

TGACTAACTA TGGAAGATTA TACCAAAATA GAG AAAAT TG GAGAAGGTAC CTATGGAGTT 180 

GTGTATAAGG GTAGACACAA AACTACAGGT CAAGTGGTAG CCATGAAAAA AATCAGACTA 240 

GAAAGTGAAG AGGAAGGGGT TCCTAGTACT GCAATTCGGG AAATTTCTCT ATTAAAGGAA 300 

CTTCGTCATC CAAATATAGT CAGTCTTCAG GATGTGCTTA TGCAGGATTC CAGGT TAT AT 3 60 

CTCATCTTTG AGTTTCTTTC CATGGAT CTG AAGAAATACT TGGATTCTAT CCCTCCTGGT 42 0 

CAGTACATGG ATTCTTCACT TGTTAAGAGT TATTTATACC AAATCCTACA GGGGATTGTG 480 

TTTTGTCACT CTAGAAGAGT TCTTCACAGA GACTTAAAAC CTCAAAATCT CT T GAT TG AT 540 

GACAAAGGAA CAATTAAACT GGCTGATTTT GGCCTTGCCA GAGCTTTTGG AATACCTATC 600 

AGAGTATATA CACATGAGGT AGTAACACTC TGGTACAGAT CTCCAGAAGT ATTGCTGGGG 660 

TCAGCTCGTT ACTCAACTCC AGTTGACATT TGGAGTATAG GCACCATATT TGCTGAACTA 720 

GCAACTAAGA AACCACTTTT CCATGGGGAT TCAGAAATTG ATCAACTCTT CAGGATTTTC 780 

AGAGCTTTGG GCACTCCCAA TAATGAAGTG TGGCCAGAAG TGGAATCTTT ACAGGACTAT 840 

AAGAATACAT TTCCCAAATG GAAACCAGGA AGCCTAGCAT CCCATGTCAA AAACTTGGAT 900 

GAAAATGGCT TGGATTTGCT CTCGAAAATG TTAATCTATG ATCCAGCCAA ACGAATTTCT 960 

GGCAAAATGG CACTGAATCA TCCATATTTT AATGATTTGG ACAATCAGAT TAAGAAGATG 1020 

TAGCTTTCTG ACAAAAAGTT TCCATATGTT ATGTCAACAG ATAGTTGTGT TTTTATTGTT 10 80 

AACTCTTGTC TATTTTTGTC T TAT AT AT AT TTCTTTGTTA TCAAACTTCA GCTGTACTTC 1140 

GTCTTCTAAT TTCAAAAATA TAACTTAAAA ATGTAAATAT TCTATATGAA TTTAAATATA 12 00 
ATTCTGTAAA TGTGAAAAAA AAAAAAAAAA AAAAA 



Seq ID NO: 240 Protein sequence: 
Protein Accession #: NP_001777.1

1 11 21 31 41 51 

] 1 I I I I 

MEDYTKIEKI GEGTYGVVYK GRHKTTGQVV AMKKIRLESE EEGVPSTAIR EISLLKELRH 60
PNIVSLQDVL MQDSRLYLIF EFLSMDLKKY LDSIPPGQYM DSSLVKSYLY QILQGIVFCH 120 



280 
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SRRVLHRDLK PQNLLIDDKG T I KL AD F GL A RAFGIPIRVY THEWTLWYR SPEVLLGSAR 
YSTPVDIWSI GTIFAELATK KPLFHGDSEI DQLFRIFRAL GTPNNEVWPE VESLQDYKNT 
FPKWKPGSLA SHVKNLDENG LDLLSKMLIY DPAKRISGKM ALNHPYFNDL DNQIKKM 



180 
240 



PCT/US02/12476 



10 



15 



20 



25 



30 



Seq ID NO: 241 DNA sequence 

Nucleic Acid Accession #: NM_033379.1 

Coding sequence: 132-854



CGCCCGCGCG 
GCTTTGCAGA 
ATTGACTAAC 
TTGTGTATAA 
TAGAAAGTGA 
AACTTCGTCA 
ATCTCATCTT 
GTCAGTACAT 
TATTGCTGGG 
TTGCTGAACT 
TCAGGATTTT 
TACAGGACTA 
AAAACTTGGA 
AACGAATTTC 
TTAAGAAGAT 
TTTTTATTGT 
AGCTGTACTT 
ATTTAAATAT 



11 

3 

CGGGCTCAAC 
GAGCGCCCTC 
TATGGAAGAT 
GGGTAGACAC 
AGAGGAAGGG 
TCCAAATATA 
TGAGTTTCTT 
GGATTCTTCA 
GTCAGCTCGT 
AGCAACTAAG 
CAGAGCTTTG 
TAAGAATACA 
TGAAAATGGC 
TGGCAAAATG 
GTAGCTTTCT 
TAACTCTTGT 
CGTCTTCTAA 
AATTCTGTAA 



21 

•I 

TTTGTAGAGC 
CAGGGACTAT 
TATACCAAAA 
AAAACTACAG 
GTTCCTAGTA 
GTCAGTCTTC 
TCCATGGATC 
CTTGTTAAGG 
TACT CAACTC 
AAACCACTTT 
GGCACTCCCA 
TTTCCCAAAT 
TTGGATTTGC 
GCACTGAATC 
GACAAAAAGT 
CTATTTTTGT 
TTT CAAAAAT 
ATGTGAAAAA 



31 



GAGGGGCCAA 
GCGTGCGGGG 
TAGAGAAAAT 
GTCAAGTGGT 
CTGCAATTCG 
AGGATGTGCT 
TGAAGAAATA 
TAGTAACACT 
CAGTTGACAT 
TCCATGGGGA 
ATAATGAAGT 
GGAAACCAGG 
TCTCGAAAAT 
ATCCATATTT 
TTCCATATGT 
CTTATATATA 
ATAACTTAAA 
AAAAAAAAAA 



41 
I 

CTTGGCAGAG 
ACACGGGATC 
TGGAGAAGGT 
AGCCATGAAA 
GGAAATTTCT 
TATGCAGGAT 
CTTGGATTCT 
CTGGTACAGA 
TTGGAGTATA 
TTCAGAAATT 
GTGGCCAGAA 
AAGCCTAGCA 
GTTAATCTAT 
TAATGATTTG 
TATGTCAACA 
TTTCTTTGTT 
AATG TAAAT A 
AAAAAA 



51 
I 

CGCGCGGCCA 60 

TACCCATACC 120 

ACCTATGGAG 180 

AAAAT C AG AC 240 

CTATTAAAGG 3 00 

TCCAGGTTAT 3 60 

ATCCCTCCTG 420 

TCTCCAGAAG 480 

GGCACCATAT 54 0 

GATCAACTCT 600 

GTGGAATCTT 660 

TCCCATGTCA 72 0 

GAT CCAG CCA 780 

GACAAT CAGA 840 

GATAGT TGTG 90 0 

ATCAAACTTC 960 

TTCTATATGA 102 0 



Seq ID NO: 242 Protein sequence: 
Protein Accession #: NP_203698.1



35 



ii 



21 



31 



41 



51 



40 



45 



50 



55 



60 



65 



70 



75 



80 



MEDYTKIEKI GEGTYGVVYK GRHKTTGQVV AMKKIRLESE EEGVPSTAIR EISLLKELRH
PNIVSLQDVL MQDSRLYLIF EFLSMDLKKY LDSIPPGQYM DSSLVKVVTL WYRSPEVLLG
SARYSTPVDI WSIGTIFAEL ATKKPLFHGD SEIDQLFRIF RALGTPNNEV WPEVESLQDY 
KNTFPKWKPG SLASHVKNLD ENGLDLLSKM LIYDPAKRIS GKMALNHPYF NDLDNQIKKM 

Seq ID NO: 243 DNA sequence 

Nucleic Acid Accession #: AF101051.1 

Coding sequence: 221-856 



11 



85 



GAGCAACCTC 
CGACCCAGAG 
GCGGGGCCCA 
ACCTGCCACC 
GCTGTTGGGC 
GCCCCAGTGG 
CGAGGGGCTG 
TGACTCCTTG 
CATCCTCCTG 
CTTGGAAGAC 
TCTTGCAGGT 
ATT CTATGAC 
TGGCTGGGCT 
CCGAAAAACA 
GAAAGACTAC 
GGACATTGAG 
GTATGGTATT 
AAACATGGCT 
TTGTATTACT 
TATATATAGA 
CTCATTATGT 
CCATATTGAT 
CAGTCAAATA 
CTAATTTACC 
TTATTTTTTA 
TTTCATTGGT 
AGCCAAGAAG 
GTGATAAATT 
TTTGCTTTGA 
CACAACTTTA 
ACCTTTTTGT 
TATATCTTCC 
GATAATCTGG 
TCTTTTTTCT 
AATATTAATT 
TTTATTTGCT 
CTTCATGTGA 
ACACATACCT 
AAACCTACGC 
ATTCTTTCAG 
TTTCCAGTCT 



AGCTTCTAGT 
CTTCTCCAGC 
GCCACCTTCG 
CCTGAGCCAG 
TTCATTCTCG 
AGGATTTACT 
TGGATGTCCT 
CTGAATCTGA 
GGAGTGATAG 
GATGAGGTGC 
CTGGCTATTT 
CCTATGACCC 
GCTGCTTCTC 
ACCTCTTACC 
GTGTGACACA 
ATACTATCAT 
ACAAAACAAA 
TAATCTTATT 
GCTTCCCATT 
TATGTATATA 
TGATACTAGC 
GAAGATGTTT 
TCATTTACTC 
AAGGATGAAT 
CCATAATCTT 
CTCTATCTCC 
AATTTATTAC 
CCTGTTGACC 
AAATATTTGT 
TTGATTGAAT 
TCCCCATTCC 
TAATAAGGTG 
TGACAAATAT 
ATCTGCCAAA 
AGTTTATATT 
CAGCTGGCTG 
TTCACTGCCT 
TCATGTGGTT 
ACATACCTTC 
CTGTGTCTGA 
GTACAGAATG 



21 

I 

ATCCAGACTC 
GGCGGCGCAG 
GGAGTCCGGG 
CGCGGGCGCC 
CCTTCCTGGG 
CCTATGCCGG 
GCGTGTCGCA 
G CAGCAC ATT 
CAATCTTTGT 
AGAAGATGAG 
TAGTTGCCAC 
CAGTCAATGC 
TCTGCCTTCT 
CAACACCAAG 
GAGGCAAAAG 
TAACATTAGG 
CAAACAAACA 
TTATCTTCTT 
GAGTAATCAT 
TACATGTTTT 
ATACTTAAAA 
ATTGGTATAT 
TTCTTCATTA 
TCTTTCAATT 
ATAGCACTTG 
TGAATCTAAC 
AAATCAGAAC 
TTCCCACACA 
CCAATTGAGT 
TTTTAAGCTA 
TTAATTGTAT 
TGGTCTGTTT 
TCTCTCTGTA 
TTGAGATAAT 
ACTCTCATTC 
AGACACTGAA 
TCCTCTCTCT 
CAGTGCCTTC 
ATGTGGCTCA 
CATGTTTGTG 
CTATTTCACT 



31 
! 

CAGCGCCGCC 
CGAGCAGGGC 
TTGCCCACCT 
CGAGCGAGTC 
ATGGATCGGC 
CGACAACATC 
GAGCACCGGG 
GCAAGCAACC 
GGCCACCGTT 
GATGGCTGTC 
AGCATGGTAT 
CAGGTACGAA 
GGGAGGTGCC 
GCCCTATCCA 
GAG AAAAT CA 
ACCTTAGAAT 
AAAAACCCAT 
TCCTCAATAT 
ACTCAAATGG 
TCTATTAAAA 
TATCTCTAAA 
TTTCTTTTTC 
GCTTTGGGTG 
CTTCATGCGT 
CAT CGTTATT 
ACATTTCATA 
TTTGGAGGCA 
ATCCCTGTAC 
AGCTGCATGC 
CTTATTCATA 
TGTTTTCCCA 
GTCTGAACAA 
GCTGTAAGCA 
GATACTTAAC 
TTTGAACATG 
GAAGTCACTG 
ACCAGTCTAT 
CTCTCTCTAC 
GTGCCTTCCT 
CTCTGTTCCA 
TG AG CAAGAT 



41 
I 

CCGGGCGCGG 
TCCCCGCCTT 
GCAAACTCTC 
ATGGCCAACG 
GCCATCGTCA 
GTGACCGCCC 
CAGATCCAGT 
CGTGCCTTGA 
GGCATGAAGT 
ATTGGGGGTG 
GGCAATAGAA 
TTTGGTCAGG 
CTACTTTGCT 
AAACCTGCAC 
TGTTGAAACA 
TTTGGGTATT 
GTGTTAAAAT 
AGGAGGGAAG 
GGGAAGGGGT 
ATAGACAGTA 
ATAGGTAAAT 
GTCCTTATAT 
CCTTTGCCAC 
GCCCTTTTCA 
AAGCCCTTAT 
GCCTACATTT 
AAT CTTTCTG 
TCTGACCCAT 
TGTTCCCCCA 
GTTTTATATC 
AGTGTAATTA 
AGTGCTAGAC 
AGTCACTTAA 
CAGTTAGAAG 
AACTATGCCT 
AACAAAACCT 
TTCCACTGAA 
CAGTCTATTT 
CTCTCTACCA 
TTTTAACAAC 
GATGTATGGA 



51 
I 

ACCCCAACCC 
AACTTCCTCC 
CGCCTTCTGC 
CGGGGCTGCA 
GCACTGCCCT 
AGGCCATGTA 
GCAAAGTCTT 
TGGTGGTTGG 
GTATGAAGTG 
CGATATTTCT 
TCGTTCAAGA 
CTCTCTTCAC 
GTTCCTGTCC 
CTTCCAGCGG 
AACCGAAAAT 
GTAATCTGAA 
ACTCAGTGCT 
ATTTTACCAT 
GCTCCTTAAA 
AAATACTATT 
GT AT T T AAT T 
ACATATGTAA 
AAGACCTAGC 
TATACTTATT 
TTGTTTTGTG 
TAGTTTCTAA 
CATGACCAAA 
AGCACTCTTG 
GGTGTTGTAA 
CCCCTAAACT 
TCATGCGTTT 
TTTCTGGAGT 
TCTTTCTACC 
AGGTAGTGTG 
ATGTAGTGTC 
ACACACGTAC 
CAAAACCTAC 
CCACTGAACA 
GTCTATTTCC 
TGCTCTTACT 
AAGGGTGTTG 



60 
120 
180 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 



281 



10 



15 



WO 02/086443 

GCACTGGTGT CTGGAGACCT 
AGCAAGGCAT TTGGCTGCTG 
CTGATCTTCC CACCTCACAG 
GTGGTTTTGT AATTTGAAAA 
CGTTTTGGTG TTGCTTTTCA 
GCCTTAACCA GTCTCTCAAG 
AAGATTCTGA GGAAGT CTTA 
ACAGATGTAA TGGGAAGAAA 
TTTTGAATCA TAATAACTCA 
TGTTAGCTGG CAGCTGACGC 
CTACACAAGG AAAGTCAGCC 
TGCCTTCCAA ACCTGAGAAT 
ATACATAGAT CTTCATGATG 
ACAAAAAAAT TTTATGGCCC 
TTTGATCTTT TTATATTCTT 
TTATAATGGG AATTTGTATA 
AAAAGGAAAA AAAAAAAAAA 



PCT/US02/12476 



GGATTTGAGT 
TAAGCTTATT 
TGATGTTGTG 
GTGCTATACT 
AATGTTTGAA 
TGATGAGACA 
TCTTCTGCAG 
TAAAAGCCTA 
TAAGGTGCTA 
TGCTAGGATA 
ACCGTGTCTT 
ATATGCTTTT 
TGTGAGTGTA 
AAAATGACCA 
CTACCACACC 
AAGCATTACT 
AAA 



CTTGGTGCTA 
GCTTCATCTG 
GGGAT CCAGT 
AAGGGAAAGA 
AATAAAAAAA 
GTGAAGTAAA 
TGAGTATGGC 
CGTGTTGGTA 
TCTGTTCAGT 
GTTAGTTTGG 
ATGAGGAATT 
GGAAGTTAAA 
ATTCCATGTG 
ACGAAATTGT 
TGGAAACAGA 
CTTTTTCAAT 



TCAATCACCG 
TAAGCGGTGG 
GAGATAGAAT 
ATTGAGGAAT 
TGTTAAGAAA 
ATTGAGTGCA 
CCAATGCTTT 
AATCCAACAG 
GATGCCCTCA 
AAATGGTACT 
GGACCTAATA 
ATTTAAATGG 
GATATCAGTT 
TACAATAGAA 
CCAATAGACA 
AAATTGTTTT 



TCTGTGTTTG 252 0 

TTTGTAATTC 2580 

ACATGTAAGT 2640 

TAACTGCATA 2700 

TGGGTTTCTT 2760 

CTAAACGAAT 2820 

CTGTGGCTAA 2 880 

CAAGGGAGAT 2 940 

GAGCTCTTGC 3 0 00 

TCATAATAAA 3 0 60 

AATTTTAGTG 3120 

CTTTTGCCAC 3180 

ACCAAACATT 3240 

TTTATCCAAT 3300 

TTTTGGGGTT 3360 

TTAATTTAAA 3420 



20 Seq ID NO: 244 Protein sequence : 
Protein Accession #: AAD16433.1 



1 11 21 31 41 51 

ryt- I I I I I I 

2 J MANAGLQLLG FILAFLGWIG AIVSTALPQW RIYSYAGDNI VTAQAMYEGL WMSCVSQSTG 

QIQCKVFDSL LNLSSTLQAT RALMVVGILL GVIAIFVATV GMKCMKCLED DEVQKMRMAV

IGGAIFLLAG LAILVATAWY GNRIVQEFYD PMTPVNARYE FGQALFTGWA AASLCLLGGA 

LLCCSCPRKT TSYPTPRPYP KPAPSSGKDY V 

30 Seq ID NO: 245 DNA sequence 

Nucleic Acid Accession #: CAT cluster 



60 
120 
180 



35 



40 



tp tp 

TTAATGGTTA 
AGCATGGTCC 
TTTTCTTCCT 
CAGTTGTTAT 
AGGTGGGGAG 
TTAATAGCCA 
GTCCTACGCC 



11 
I 

TTTTTTTTTT 
AATGCTGTTT 
CGAGAGTCTG 
GAGATTTAGT 
GAAGAATGCA 
GTCGCTCAAG 
CTGCACTTCA 
CACGGAGTCT 



21 
I 

TTTTTCAAGG 
ACCAAGTGAC 
ACAAACCTCA 
TTCTTCATCG 
TATATTAGAA 
CCCAGGAATT 
GCCTGGGCAA 
CGCTGATTGC 



31 

AGAGCACAAG 
CCAGAGGCAG 
GTTCAAATCC 
TTAACAATGA 
TGCCTGTAGT 
CAAAGCTGCA 
TGTAGTAAGA 
TAGCACAGCA 



41 


51 




1 

GAACTTTATT 


1 

AATGACTTTC 


60 


CGTGGTTTAG 


TGGTTTCAAC 


120 


TTCTTTTGTC 


TTCACTTAGT 


180 


GGATATTAAT 


ATGTTTCACA 


240 


CTCAGCTACT 


CAGGAGGCTA 


300 


ATGCATTATG 


ATTACAGCTG 


360 


TCCCATCTCT 


GGCTCGGAGG 


420 


GTCTGAGATC 


AAACTGCA 





Seq ID NO: 246 DNA sequence 
45 Nucleic Acid Accession #: XM_058553.2 
Coding sequence: 897-1400 



50 



55 



60 



65 



70 



75 



1 

I 

AATTTTCAGA 
TAAATGTATT 
GTGAAACCAT 
CTGTTAT CCA 
ATAGAGGGAA 
TGGGATGAGA 
GATCATGTTT 
GTTGAGTGTA 
ACTGGTAACC 
TTATTTCTGT 
TTGTCCAGGC 
GCCTTTGCCT 
TTTTTTTGTT 
TAGTCTTGCT 
CAGCCTCCCA 
AAGAAACTTA 
ACCATCAAAT 
CTGATGTTGC 
CTGAAATTAG 
TCAACCAAAC 
CTTGCGATGA 
GCACAACTCA 
ATAACCTGGC 
ACAATGGAAA 
GTTGCTTCTT 
AACTCCCTGT 
TTTAATGCAA 



11 
I 

AGTTTCGTAT 
TAGTCT CAGT 
TTCTCTTTTA 
TAATATGGAC 
TGAGTATTAA 
GGAGGTGAAA 
AAGAAAAGTC 
TACTGTCTGT 
TGCCTATCTG 
GTTTATGTAT 
CAAGTGCAAT 
CCTGAGTAGC 
TGTTTGTTTG 
TTGTTGCCAG 
GAGTGCTAGG 
CACCGACTCC 
CAGGGCTTGC 
AAGCAAATTG 
TCATCATATC 
CAGGAGCCTT 
AGACTGGGAT 
CTACTCTGAC 
TTCAGGCATG 
TGCACAGTAA 
CTTCTACCAG 
GACTTTCCAA 
GAACCCTCAT 



21 
I 

GGGGATGGTT 
GCTCAATAGA 
ATGTTTCACA 
AGTTCTTGAG 
TTGGAGAAGC 
CCTCACTAGA 
ATGAAAATGG 
CAAAGACTTC 
TATTTTTAAG 
AAGGGGTTTT 
GGCACGAACC 
TGGGACTACA 
TTTGTTTTTG 
GCTAGTCTCA 
ATTACAGCAC 
CTGGACCCTG 
AGGTTTCCTT 
GCTACTTGTC 
TCAAGCTGTG 
AGACAAGAGA 
AAAGATTTGT 
AACAACAGCC 
CGAGTTCCCA 
CTGAATACCT 
TGGGTTCTCA 
ACTGACAAG C 
ACTCAGAAGC 



31 
I 

TTATATAAAT 
AGAGATTTCT 
TTCCTGTTAC 
TCCTAACATT 
TTAAAGTATT 
AAAAGGGACA 
TGAACTAGTG 
CAGCATTTCC 
AACCCAGGAG 
TTGTTTTTTT 
TCATAGCTCC 
GGCATGAGCC 
GGGGGGGTTG 
AACT CCTGGC 
TTGGATTCAG 
AGAAGCTATT 
ATCATCTTAT 
CCTTCAATGC 
ATGACAGAAG 
CTCTGGCTGA 
GGGAGCAGAC 
CTGCGAGCAA 
AATCTCTGCC 
ATCTCATCAA 
TTTTCCTCCT 
ACACTTTTTT 
TTCCAAATAA 



41 
I 

TCAGGTTTTT 
AATAGAAAAG 
AGATTTGTTC 
GAGAGGTTTT 
GCCACTTTAG 
ATGTTAGTGT 
TTTCCAAGCA 
AGGTCCTAGA 
GAAAGCTTTA 
AAAGACAGGA 
TGGACTTAAG 
CCCATGCCTG 
TTTTGTTTTT 
TT CAAGTGAT 
CTTCTTCATT 
GCAATGCCCC 
CAAGTGCAGA 
TCGCCACCAG 
TTGTATTGAG 
GAGCACTTGG 
CAGCACCCCA 
CATAGTTACA 
GTATGTTCTG 
ATGCCAGACC 
AATCTAATTA 
CCTCCCCCCT 
ACCTTTGATA 



51 
i 

CCCACAATAA 60 

GATTCAAACT 12 0 

TCTTGTGACT 180 

CCCTTAGTGC 240 

CACTGAAGAT 300 

GGCCCTTCCT 360 

TATTGGAAGG 420 

GAGGAACAAG 480 

TAATAGAACA 540 

TCTCACTCCA 600 

TGATCTGCCT 660 

GCTAAGTTTG 720 

TGTAGAGACG 780 

CCTCCTGCCT 840 

TCCAACATGG 90 0 

TATGACAAAA 960 

AAGAATCATC 102 0 

GTTCCTCGAG 10 8 0 

CAAGATGTTG 1140 

CAGTGCCCTC 1200 

TTTGTCTGGG 1260 

GAACATAAG A 1320 

CCATGGAAAA 13 80 

CTAGAAGACT 1440 

TAGAATGGTA 1500 

TGAATCCTCA 1560 
CAGATTG 



80 



85 



Seq ID NO: 247 Protein sequence: 
Protein Accession #: XP_058553.1 

1 li 21 31 41 51 

I I I I I 1 

MEETYTDSLD PEKLLQCPYD KNHQIRACRF PYHLIKCRKN HPDVASKLAT CPFNARHQVP 

RAEISHHISS CDDRSCIEQD WNQTRSLRQ ETLAESTWQC PPCDEDWDKD LWEQTSTPFV 

WGTTHYSDNN SPASNIVTEH KNNLASGMRV PKSLPYVLPW KNNGNAQ 



60 
120 



282 



WO 02/086443 

Seq ID NO: 248 DNA sequence 
Nucleic Acid Accession #: NM_003392 
Coding sequence: 758.. 1855 



PCT7US02/12476 



5 



i 



li 



21 



31 



41 



51 



TTAAGGAAAT CCGGGCTGCT CTTCCCCATC TGGAAGTGGC TTTCCCCACA TCGGCTCGTA 60 

AACTGATTAT GAAACATACG ATGTTAATTC GGAGCTGCAT TTCCCAGCTG GGCACTCTCG 120 

10 CGCGCTGGTC CCCGGGGCCT CGCCCCCCAC CCCCTGCCCT TCCCTCCCGC GTCCTGCCCC 180 

CATCCTCCAC CCCCCGCGCT GGCCACCCCG CCTCCTTGGC AGCCTCTGGC GGCAGCGCGC 240 

TCCACTCGCC TCCCGTGCTC CTCTCGCCCA TGGAATTAAT TCTGGCTCCA CTTGTTGCTC 3 00 

GGCCCAGGTT GGGGAGAGGA CGGAGGGTGG CCGCAGCGGG TTCCTGAGTG AATTACCCAG 360 

GAGGGACTGA GCACAGCACC AACTAGAGAG GGGTCAGGGG GTGCGGGACT CGAGCGAGCA 42 0 

15 GGAAGGAGGC AGCGCCTGGC ACCAGGGCTT TGACT CAAC A GAATTGAGAC ACGTTTGTAA 48 0 

TCGCTGGCGT GCCCCGCGCA CAGGATCCCA GCGAAAATCA GATTTCCTGG TGAGGTTGCG 540 

TGGGTGGATT AATTTGGAAA AAGAAACTGC CTATATCTTG CCATCAAAAA ACT CACGGAG 60 0 

GAGAAGCGCA GTCAATCAAC AGTAAACTTA AGAGACCCCC GATGCTCCCC TGGTTTAACT 660 

TGTATGCTTG AAAATTATCT GAGAGGGAAT AAACATCTTT TCCTTCTTCC CTCT CCAGAA 72 0 

20 GT C CAT TGG A ATATTAAGCC CAGGAGTTGC TTTGGGGATG GCTGGAAGTG CAATGTCTTC 780 

CAAGTTCTTC CTAGTGGCTT TGGCCATATT TTTCTCCTTC GCCCAGGTTG TAATTGAAGC 840 

CAATTCTTGG TGGTCGCTAG GTATGAATAA CCCTGTTCAG ATGTCAGAAG TATATATTAT 90 0 

AGGAGCACAG CCTCTCTGCA GCCAACTGGC AGGACTTTCT CAAGGACAGA AGAAACTGTG 960 

CCACTTGTAT CAGGACCACA TGCAGTACAT CGGAGAAGGC GCGAAGACAG GCATCAAAGA 102 0 

25 ATGCCAGTAT CAATT CCGAC ATCGACGGTG GAACTGCAGC ACTGTGGATA ACACCTCTGT 10 80 

TTTTGGCAGG GTGATGCAGA TAGGCAGCCG CGAGACGGCC TTCACATACG CCGTGAGCGC 1140 

AGCAGGGGTG GTGAACGCCA TGAGCCGGGC GTGCCGCGAG GGCGAGCTGT CCACCTGCGG 12 00 

CTGCAGCCGC GCCGCGCGCC CCAAGGACCT GCCGCGGGAC TGGCTCTGGG GCGGCTGCGG 12 60 

CGACAACATC GACTATGGCT ACCGCTTTGC CAAGGAGTTC GTGGACGCCC GCGAG CGGG A 132 0 

30 GCGCATCCAC GCCAAGGGCT CCTACGAGAG TGCTCGCATC CTCATGAACC TGCACAACAA 13 80 

CGAGGCCGGC CGCAGGACGG TGTACAACCT GGCTGATGTG GCCTGCAAGT GCCATGGGGT 1440 

GTCCGGCTCA TGTAGCCTGA AGACATGCTG GCTGCAGCTG GCAGACTTCC GCAAGGTGGG 1500 

TGATGCCCTG AAGGAGAAGT ACGACAGCGC GGCGGCCATG CGGCTCAACA GCCGGGGCAA 1560 

GTTGGTACAG GTCAACAGCC GCTTCAACTC GCCCACCACA CAAGACCTGG TCTACATCGA 1620 

35 CCCCAGCCCT GACTACTGCG TGCGCAATGA GAGCACCGGC TCGCTGGGCA CGCAGGGCCG 1680 

CCTGTGCAAC AAGACGTCGG AGGGCATGGA TGGCTGCGAG CTCATGTGCT GCGGCCGTGG 1740 

GTACGACCAG TTCAAGACCG TGCAGACGGA GCGCTGCCAC TGCAAGTTCC ACTGGTGCTG 180 0 

CTACGTCAAG TGCAAGAAGT GCACGGAGAT CGTGGACCAG TTTGTGTGCA AGTAGTGGGT 1860 

GCCACCCAGC ACTCAGCCCC GCTCCCAGGA CCCGCTTATT TATAGAAAGT ACAGTGATTC 192 0 

40 TGGTTTTTGG TTTTTAGAAA TATTTTTTAT TTTTCCCCAA GAATTGCAAC CGGAACCATT 1980 

TTTTTTCCTG TTACCATCTA AGAACTCTGT GGTTTATTAT TAATATTATA ATTATTATTT 2040 

GGCAATAATG GGGGTGGGAA CCACGAAAAA TATTTATTTT GTGGATCTTT GAAAAGGTAA 2100 

TACAAGACTT CTTTTGGATA GTATAGAATG AAGGGGGAAA TAACACATAC CCTAACTTAG 2160 

CTGTGTGGGA CATGGTACAC ATCCAGAAGG TAAAGAAATA CATTTTCTTT TTCTCAAATA 2220 

45 TGCCATCATA TGGGATGGGT AGGTTCCAGT TGAAAGAGGG TGGTAGAAAT CTATTCACAA 2280 

TTCAGCTTCT ATGACCAAAA TGAGTTGTAA ATTCTCTGGT GCAAGATAAA AGGTCTTGGG 2340 

AAAACAAAAC AAAACAAAAC AAACCTCCCT TCCCCAGCAG GGCTGCTAGC TTGCTTTCTG 2400 

CATTTTCAAA ATGATAATTT ACAATGGAAG GACAAGAATG TCATATTCTC AAGGAAAAAA 2460 

GGTATATCAC ATGTCT CAT T CTCCTCAAAT ATTCCATTTG CAGACAGACC GTCATATTCT 252 0 

50 AATAGCTCAT GAAATTTGGG CAGCAGGGAG GAAAGTCCCC AGAAATTAAA AAATTTAAAA 2580 

CTCTTATGTC AAGATGTTGA TTTGAAGCTG TTATAAGAAT TGGGATTCCA GATTTGTAAA 2640 

AAGACCCCCA ATGATTCTGG ACACTAGATT TTTTGTTTGG GGAGGTTGGC TTGAACATAA 2 700 

ATGAAAT AT C CTGTATTTTC TTAGGGATAC TTGGTTAGTA AATTATAATA GTAGAAATAA 2 760 

TACATG AAT C CCATTCACAG GTTTCTCAGC CCAAGCAACA AGGTAATTGC GTGCCATTCA 2 82 0 

55 GCACTGCACC AGAGCAGACA ACCTATTTGA GGAAAAACAG TGAAAT CCAC CTTCCTCTTC 2 880 

ACACTGAGCC CTCTCTGATT CCTCCGTGTT GTGATGTGAT GCTGGCCACG TTTCCAAACG 2 940 

GCAGCTCCAC TGGGTCCCCT TTGGT TGTAG GACAGGAAAT GAAACATTAG GAGCTCTGCT 3000 

TGGAAAACAG TTCACTACTT AGGGATTTTT GTTTCCTAAA ACTTTTATTT TGAGGAGCAG 3060 

TAGTTTTCTA TGTTTTAATG ACAGAACTTG GCTAATGGAA TTCACAGAGG TGTTGCAGCG 3120 

60 TATCACTGTT ATGATCCTGT GTTTAGATTA TCCACTCATG CTTCTCCTAT TGTACTGCAG 3180 

GTGTACCTTA AAACTGTTCC CAGTGTACTT GAACAGTTGC ATTTATAAGG GGGGAAATGT 3240 

GGTTTAATGG TGCCTGATAT CTCAAAGTCT TTTGTACATA ACATATATAT ATATATACAT 3300 

ATATATAAAT ATAAATATAA ATATATCTCA TTGCAGCCAG TGATTTAGAT TTACAGCTTA 3360 

CTCTGGGGTT ATCTCTCTGT CTAGAGCATT GTTGTCCTTC ACTGCAGTCC AGTTGGGATT 3420 

65 ATT CCAAAAG TTTTTTGAGT CTTGAGCTTG GGCTGTGGCC CCGCTGTGAT CATACCCTGA 3480 

GCACGACGAA GCAACCTCGT TTCTGAGGAA GAAGCTTGAG TTCTGACTCA CTGAAATGCG 3540 

TGTTGGGTTG AAGATATCTT TTTTTCTTTT CTGCCTCACC CCTTTGTCTC CAACCTCCAT 3 60 0 

TTCTGTTCAC TTTGTGGAGA GGGCATTACT TGTTCGTTAT AGACATGGAC GTTAAGAGAT 3660 

ATTCAAAACT CAGAAGCATC AGCAATGTTT CTCTTTTCTT AGTTCATTCT GCAGAATGGA 372 0 

70 AACCCATGCC TATTAGAAAT GACAGTACTT ATTAATTGAG TCCCTAAGGA ATATTCAGCC 3780 

CACTACATAG ATAGCTTTTT TTTTTTTTTT TTTTTTTTAA TAAGGACACC TCTTTCCAAA 3840 

CAGGCCATCA AATATGTTCT TATCTCAGAC TTACGTTGTT TTAAAAGTTT GGAAAGATAC 3900 

ACATCTTTTC ATACCCCCCC TTAGGAGGTT GGGCTTTCAT AT CACCTCAG CCAACTGTGG 3 960 

CTCTTAATTT ATTGCATAAT GATATCCACA TCAGCCAACT GTGGCTCTTT AATTTATTGC 402 0 

75 ATAATGATAT TCACATCCCC TCAGTTGCAG TGAATTGTGA GCAAAAGATC TTGAAAGCAA 4080 

AAAGCACTAA TTAGTTTAAA ATGTCACTTT TTTGGTTTTT ATTATACAAA AACCATGAAG 4140 

TACTTTTTTT ATTTGCTAAA TCAGATTGTT CCTTTTTAGT GACTCATGTT TATGAAGAGA 42 00 

GTTGAGTTTA ACAATCCTAG CTTTTAAAAG AAACTATTTA ATGTAAAATA TTCTACATGT 42 60 

CATTCAGATA TTATGTATAT CTTCTAGCCT TTATTCTGTA CTTTTAATGT ACATATTTCT 432 0 

80 GTCTTGCGTG ATTTGTATAT TTCACTGGTT TAAAAAACAA ACATCGAAAG GCTTATTCCA 43 8 0 
AATGGAAGAT AGAATATAAA ATAAAACGTT ACTTGTAAAA AAAAAAAA 



85 



Seq ID NO: 249 Protein sequence: 
Protein Accession #: NP 003383 



1 



11 



21 



31 



41 



51 



283 



WO 02/086443 

MAGSAMSSKF FLVALAIFFS FAQWIEANS WWSLGMNNPV QMSEVYIIGA QPLCSQLAGL 
SQGQKKLCHL YQDHMQYIGE GAKTG I KECQ YQFRHRRWNC STVDNTSVFG RVMQIGSRET 
AFTYAVSAAG WNAMSRACR EGELSTCGCS RAARPKDLPR DWLWGGCGDN IDYGYRFAKE 
FVDARERERI HAKGSYESAR I LMNLHNNE A GRRTVYNLAD VACKCHGVSG SCSLKTCWLQ 
LAD FRKVGD A LKEKYD S AAA MRLNSRGKLV QVNSRFNSPT TQDLVYIDPS PDYCVRNEST 
GSLGTQGRLC NKTSEGMDGC ELMCCGRGYD QFKTVQTERC HCKFHWCCYV KCKKCTEIVD 
QFVCK 

Seq ID NO: 250 DNA sequence 
Nucleic Acid Accession ft: NM_014058 
Coding sequence: 56.. 1324 

1 11 21 31 41 51 

l l I l l l 

TGACTTGGAT GTAGACCTCG ACCTTCACAG GACTCTTCAT TGCTGGTTGG CAATGATGTA 
TCGGCCAGAT GTGGTGAGGG CTAGGAAAAG AGTTTGTTGG GAACCCTGGG TTATCGGCCT 
CGTCATCTTC ATATCCCTGA TTGTCCTGGC AGTGTGCATT GGACTCACTG TTCATTATGT 
GAGATATAAT CAAAAGAAGA CCTACAATTA CTATAGCACA TTGTCATTTA CAACTGACAA 
ACTATATGCT GAGTTTGGCA GAGAGGCTTC TAACAATTTT ACAGAAATGA GCCAGAGACT 
TGAATCAATG GTGAAAAATG CATTTTATAA ATCTCCATTA AGGGAAGAAT TTGT CAAGTC 
TCAGGTTATC AAGTTCAGTC AACAGAAGCA TGGAGTGTTG GCTCATATGC TGTTGATTTG 
TAGATTTCAC TCTACTGAGG ATCCTGAAAC TGTAGATAAA ATTGTT CAAC TTGTTTTACA 
TGAAAAGCTG CAAGATGCTG TAGGACCCCC TAAAGTAGAT CCTCACTCAG TTAAAATTAA 
AAAAATCAAC AAGACAGAAA CAGACAGCTA TCTAAACCAT TGCTGCGGAA CACGAAGAAG 
TAAAACTCTA GGT CAGAGTC TCAGGATCGT TGGTGGGACA GAAGTAGAAG AGGGTGAATG 
GCCCTGGCAG GCTAGCCTGC AGTGGGATGG GAGTCATCGC TGTGGAGCAA CCTTAATTAA 
TGCCACATGG CTTGTGAGTG CTGCTCACTG TTTTACAACA TATAAGAACC CTGCCAGATG 
GACTGCTTCC TTTGGAGTAA CAATAAAACC TTCGAAAATG AAACGGGGTC TCCGGAGAAT 
AATTGTCCAT GAAAAATACA AACACCCATC ACATGACTAT GATATTTCTC TTGCAGAGCT 
TTCTAGCCCT GTTCCCTACA CAAATGCAGT ACATAGAGTT TGTCTCCCTG ATGCATCCTA 
TGAGTTTCAA CCAGGTGATG TGATGTTTGT GACAGGATTT GGAGCACTGA AAAATGATGG 
TTACAGTCAA AATCATCTTC GACAAGCACA GGTGACTCTC ATAGACGCTA CAACTTGCAA 
TGAACCTCAA GCTTACAATG ACGCCATAAC TCCTAGAATG TTATGTGCTG GCTCCTTAGA 
AGGAAAAACA GATGCATGCC AGGGTGACTC TGGAGGACCA CTGGTTAGTT C AG ATG C TAG 
AGATATCTGG TACCTTGCTG GAATAGTGAG CTGGGGAGAT GAATGTGCGA AAC C CAAC AA 
GCCTGGTGTT TATACTAGAG TTACGGCCTT GCGGGACTGG ATTACTTCAA AAACTGGTAT 
CTAAGAGAGA AAAGCCTCAT GGAACAGATA ACATTTTTTT TTGTTTTTTG GGTGTGGAGG 
CCATTTTTAG AGATACAGAA TTGGAGAAGA CTTGCAAAAC AGCTAGATTT GACTGATCTC 
AATAAACTGT TTGCTTGATG CAAAAAAAAA A 



Seq ID NO: 251 Protein sequence: 
Protein Accession #: NP_054777 

1 11 21 31 41 51 

I I I I I I 

MYRPDWRAR KRVCWEPWVI GDVIFISLIV LAVC I GLTVH YVRYNQKKTY NYYSTLSFTT 

DKLYAEFGRE ASNNFTEMSQ RLESMVKNAF YKSPLREEFV KSQVIKFSQQ KHGVLAHMIjD 

ICRFHSTEDP ETVDKIVQLV LHEKLQDAVG PPKVDPHSVK IKKINKTETD SYLNHCCGTR 

RSKTLGQSLR IVGGTEVEEG EWPWQASLQW DGSHRCGATL I NAT WL VS AA HCFTTYKNPA 

RWTASFGVTI KPSKMKRGLR R I I VHEKYKH PSHDYDISLA ELSSPVPYTN AVHRVCLPDA 

SYEFQPGDVM FVTGFGALKN DGYSQNHLRQ AQVTLIDATT CNEPQAYNDA ITPRMLCAGS 

LEGKTDACQG DSGGPLVSSD ARDIWYLAGI VSWGDECAKP NKPGVYTRVT ALRDWITSKT 

GI 

Seq ID NO: 252 DNA sequence 

Nucleic Acid Accession #: NM_003504.2 

Coding sequence: 71-1771 

1 ll 21 31 41 51 

I i i i i I 

GGCACGAGGC CTCGTGCCGC CGGGCTCTTG GT AC C T C AG C GCGAGCGCCA GGCGTCCGGC 
CGCCGTGGCT ATGTTCGTGT CCGATTTCCG CAAAGAGTTC TACGAGGTGG TCCAGAGCCA 
GAGGGTCCTT CTCTTCGTGG CCTCGGACGT GGATGCTCTG TGTGCGTGCA AGATCCTTCA 
GGCCTTGTTC CAGTGTGACC ACGTGCAATA TACGCTGGTT CCAGTTTCTG GGTGGCAAGA 
ACTTGAAACT GCATTTCTTG AGCATAAAGA ACAGTTTCAT TATTTTATTC TCATAAACTG 
TGGAGCTAAT GTAGACCTAT TGGATATTCT TCAACCTGAT GAAGACACTA TATTCTTTGT 
GTGTGACACC CATAGGCCAG TCAATGTCGT CAATGTATAC AACGATACCC AGATCAAATT 
ACTCATTAAA CAAGATGATG ACCTTGAAGT TCCCGCCTAT GAAGACATCT T CAGGG ATG A 
AGAGGAGGAT GAAGAGCATT CAGGAAATGA CAGTGATGGG TCAGAGCCTT CTGAGAAGCG 
CACACGGTTA GAAGAGGAGA TAGTGGAGCA AACCATGCGG AGGAGGCAGC GGCGAGAGTG 
GGAGGCCCGG AGAAGAGACA TCCTCTTTGA CTACGAGCAG TATGAATATC ATGGGACATC 
GTCAGCCATG GTGATGTTTG AGCTGGCTTG GATGCTGTCC AAGGACCTGA ATGACATGCT 
GTGGTGGGCC ATCGTTGGAC TAACAGACCA GTGGGTGCAA GACAAGATCA CTCAAATGAA 
ATACGTGACT GATGT TGGTG TCCTGCAGCG CCACGTTTCC CGCCACAACC ACCGGAACGA 
GGATGAGGAG AACACACT CT CCGTGGACTG CACACGGATC TCCTTTGAGT ATGACCTCCG 
CCTGGTGCTC TACCAGCACT GGTCCCTCCA TGACAGCCTG TGCAACACCA GCTATACCGC 
AGCCAGGTTC AAGCTGTGGT CTGTGCATGG ACAGAAGCGG CTCCAGGAGT TCCTTGCAGA 
CATGGGTCTT CCCCTGAAGC AGGTGAAGCA GAAGTTCCAG GCCATGGACA TCTCCTTGAA 
GGAGAATTTG CGGGAAATGA TTGAAGAGTC TGCAAATAAA TTTGGGATGA AGGACATGCG 
CGTGCAGACT TTCAGCATTC ATTTTGGGTT CAAGCACAAG TTTCTGGCCA GCGACGTGGT 
CTTTGCCACC ATGTCTTTGA TGGAGAGCCC CGAGAAGGAT GGCTCAGGGA CAGATCACTT 
CAT CCAGGCT CTGGACAGCC TCTCCAGGAG TAACCTGGAC AAGCTGTACC ATGGCCTGGA 
ACTCGCCAAG AAGCAGCTGC GAGCCACCCA GCAGACCATT GCCAGCTGCC TTTGCACCAA 
CCTCGTCATC TCCCAGGGGC CTTTCCTGTA CTGCTCTCTC ATGGAGGGCA CTCCAGATGT 
CATGCTGTTC TCTAGGCCGG CATCCCTAAG CCTGCTCAGC AAACACCTGC TCAAGTCCTT 
TGTGTGTTCG ACAAAGAACC GGCGCTGCAA ACTGCTGCCC CTGGTGATGG CTGCCCCCCT 



284 



WO 02/086443 

GAGCATGGAG CATGGCACAG 
CAGGAAGAAC TTTTTTGGGA 
GCTGCACAAC CATTTTGACC 
TCTGGACGCA CTTATTTCCC 
ATTTATGTAA CTGGCTTTCA 
CCATTTTTTA TTAAATAAAA 
AAAAAAAAAA AA 



PCT/US02/12476 



TGACCGTGGT 
GGGCGTTTGA 
TCTCAGTAAT 
TCCTGTCCTA 
TTTAGATTGT 
TGCTTATTTT 



GGGCATCCCC 
GAAGGCAGCG 
TGAGCTGAAA 
GGAATTTGAT 
AAGTTATGGA 
AGGCTCCGTC 



CCAGAGACCG 
GAAAGCACCA 
GCTGAGGATC 
TCTTCCAGAA 
CATGATT TGA 
CCCAAAAAAA 



ACAGCTCGGA 1620 

GCTCCCGGAT 1680 

GGAGCAAGTT 1740 

TGACCTTCTT 1800 

GATGTAGAAG 1860 

AAAAAAAAAA 1920 



Seq ID NO: 253 Protein sequence: 
10 Protein Accession #: NP 003495.1 



15 



20 



25 



MFVSDFRKEF 
AFLEHKEQFH 
QDDDLEVPAY 
RRDILFDYEQ 
DVGVLQRHVS 
KLWSVHGQKR 
FSIHFGFKHK 
KQLRATQQTI 
TKNRRCKIiLP 
HFDLSVIELK 



11 
I 

YEWQSQRVI* 
YFILINCGAN 
ED I FRDEEED 
YEYHGT S SAM 
RHNHRNEDEE 
LQEFLADMGL 
FLASDWFAT 
ASCLCTNLVI 
LVMAAPLSME 
AEDRSKFLDA 



21 

I 

LFVASDVDAL 
VDLLDILQPD 
EEHSGNDSDG 
VMFELAWMLS 
NTLSVDCTRI 
PLKQVKQKFQ 
MSLMESPEKD 
SQGPFLYCSL 
HGTVTWGIP 
LISLLS 



31 
I 

CACKILQALF 
EDT I FFVCDT 
SEPSEKRTRI) 
KDLNDMLWWA 
SFEYDLRLVL 
AMDISLKENL 
GSGTDHFIQA 
MEGTPDVMLF 
PETDSSDRKN 



41 

I 

QCDHVQYTLV 
HRPVNWNVY 
EEEIVEQTMR 
IVGLTDQWVQ 
YQHWSLHDSL 
REMIEESANK 
LDSIjSRSNLD 
SRPASLSLLS 
FFGRAFEKAA 



51 
I 

PVSGWQELET 60 

NDTQIKLLIK 120 

RRQRREWEAR 180 

DKITQMKYVT 240 

CNTSYTAARF 3 00 

FGMKDMRVQT 3 60 

KLYHGLELAK 420 

KHLLKSFVCS 480 

EST SSRMLHN 540 



Seq ID NO: 254 DNA sequence 
Nucleic Acid Accession #: NM_022337 
Coding sequence: 48.. 683 



30 



35 



40 



45 



50 



55 



60 



i 

I 

GGCTGCGCTT 
ACAAGGAGCA 
T CATC AAGCG 
ACTTCGCGCT 
ATATCGCAGG 
GTGCATTTAT 
AAAATGATTT 
TGGCCAACAA 
AGTTCTGCAA 
ACATTGATGA 
TGGAGTCTAT 
GCTCTGGCTG 
TTGTTCCACA 
CACATGTGGC 
GTTCTTTCTA 
TCTGTTACAA 
TTATTTGCTT 
AACTAGCTGT 
AATATATTCT 
GACCTCCATT 
ACAGGTGTGC 
AACTGAATAT 
CTCAAGCTGT 
GCAAGTGAAC 



11 



CCCTGGTCAG 
CCTGTACAAG 
CTACGTGCAC 
CAAGGTGCTC 
TCAAGAAAGA 
TGTCTTCGAT 
GGACTCCAAG 
ATGTGACCAG 
GGAGCACGGT 
AGCCT CCAGA 
TGAGCCGGAC 
TGCCAAATCC 
AATTGTGCCT 
AAGCCAAAGA 
TGCTTTCCTC 
ACTTCTGTCA 
CTTTTAATCA 
CAAGTCAAGG 
CTGATGGCCT 
CTCGGCAGAC 
TATATTGTCC 
TGTATGAAAA 
GGGGCTCCTC 
AATAAAACAT 



21 
I 

GCACGGCACG 
TTGCTGGTGA 
CAGAACTTCT 
CACTGGGACC 
TTTGGAAACA 
GTCACCAGGC 
TTAAGTCTCC 
GGGAAGGATG 
TTCGTAGGAT 
TGCCTGGTGA 
GTCGTGAAGC 
TAGTAGGCAC 
CTATTTTTAC 
TCTATGCCTC 
ACCATCATCA 
TGTAGCTGAC 
GCAAAGGCCT 
ACTGGCTTTC 
GACAGGCCTA 
CTAAGAGTTG 
TTGTCCTAAC 
GACATGCCTC 
TATACATGCT 
TAAAAGATAA 



31 



TCTGGCCGGC 
TTGGCGACCT 
CCTCGCACTA 
CGGAGACTGT 
TGACGAGGGT 
CAGCCACATT 
CTAATGGCAA 
TGCT CATGAA 
GGTTTGAAAC 
AACACATACT 
CCCATCTCAC 
CTTTGCTGGT 
CATTTTGGGT 
TGTTTTTTCA 
CAGTGTTTAC 
CAAAATCCTG 
CAAGTCTTAA 
ACCTTGCCCT 
TTAAGTAGAT 
CCTCTGAGTT 
TGTCACTTGC 
CATATGTGCC 
ATACATGTAA 
AA 



41 
I 

CGCCAGGATG 
GGGCGTGGGG 
CCGGGCCACA 
GGTGCGCCTG 
CTATTACCGA 
TGAAGCAGTG 
ACCGGTTTCA 
CAATGGCCTC 
ATCAGCAAAG 
TGCAAATGAG 
ATCAACCAAG 
GTCTGGTAGG 
AAACGTCAGG 
ATGAGAGAGA 
AAACTTTTGA 
CAGGGCCACA 
AATAAAAGGG 
GGTGTCTTTT 
GTGATATTTT 
AGCTCTTTGG 
CATGGCCTGA 
TTTCTGTTAG 
TATATATTAT 



51 
I 

CAGGCCCCGC 
AAGACCAGTA 
AT CGGCGTGG 
CAGCTCTGGG 
GAAGCTATGG 
GCAAAGTGGA 
GTGGTTTTGT 
AAGATGGACC 
GAAAATATAA 
TGTGACCTAA 
GTTGCCAGCT 
AATGACCTCA 
ATAGATATAC 
AATAGCAAAT 
AAATATTTAG 
GTCGGCACTG 
GAGAAGAACA 
TCCAGATTTC 
CTTCCAAGAT 
AATCGTGAAC 
ATGTTGGCTT 
CTCTCTTTGA 
ATATATTTTT 



Seq ID NO: 255 Protein sequence: 
Protein Accession #: NP 071732 



11 



65 



21 31 41 51 

I I I I 

MQAPHKEHLY KLLVIGDLGV GKTSIIKRYV HQNFSSHYRA TIGVDFADKV LHWDPETWR 

LQLWDIAGQE RFGNMTRVYY REAMGAFIVF DVTRPATFEA VAKWKNDLDS KLSLPNGKPV 

SWLLANKCD QGKDVLMNNG LKMDQFCKEH GFVGWFETSA KEN IN IDEAS RCLVKH I LAN 

ECDLMESIEP DWKPHLTST KVASCSGCAK S 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 



60 
120 
180 



70 



75 



80 



85 



Seq ID NO: 256 DNA sequence 
Nucleic Acid Accession #: NM__016321 
Coding sequence: 25.. 1464 



11 



GGAACCGCCC 
CCGCTGGCGG 
GGTGTTCGTG 
GAACTTGAGC 
CGTGATGGTC 
CGCCGTGGGC 
GGGCTGGTTC 
CGCTGACTTC 
CCCCATTCAG 
CATTCTCCTT 
TGGCGCCTAC 
CAAGGAGAGA 
CCTGTGGATG 
CCGAGCCGCC 



GCTGCCAGCC 
CTGCCGCTCA 
CGCTACGACT 
GACATGGAGA 
TTCGTGGGCT 
TTCAACTTCC 
CACTTCTTAC 
TGCGTGGCCT 
CTGCTCATCA 
AACCTGCTAA 
TTTGGGCTCA 
CAGAATTCTG 
TACTGGCCCA 
ATCAACACCT 



21 
I 

CGGCCAGGCA 
CCTGCCTGCT 
TCGAGGCCGA 
ACGAATTCTA 
TCGGCTTCCT 
TGTTGGCAGC 
AAGACCGCTA 
CTGTCTGCGT 
TGACTTTCTT 
AGGTGAAGGA 
CAGTGACCCG 
TGTACCAGTC 
GCTTCAACTC 
ACTGCTCCTT 



31 



CCCCTGCAGC 
CCTGCAGGTG 
CGCCCACTGG 
CT AT CGCTAC 
CATGACTTTC 
CTTCGGCATC 
CATCGTCGTG 
GGCCTTTGGG 
CCAAGTGACC 
TGCAGGAGGC 
GATCCTCTAC 
GGACCTCTTT 
AGCCATATCC 
GGCAGCCTGC 



41 
I 

ATGGCCTGGA 
ATTATGGTGA 
TGGTCAGAGA 
CCAAGCTTCC 
CTGCAGCGCT 
CAGTGGGCGC 
GGCGTGGAGA 
GCAGTTCTGG 
CTCTTCGCTG 
TCCATGACCA 
CGACGCAACC 
GCCATGATTG 
TACCATGGGG 
GTGCTTACCT 



51 

1 

ACACCAACCT 60 

TTCTCTTCGG 12 0 

GGACGCACAA 180 

AGGACGTGCA 240 

ACGGCTTCAG 3 00 

TGCTCATGCA 3 60 

ACCT CATCAA 42 0 

GTAAAGTCAG 480 

TGAATGAGTT 540 

TCCACACATT 600 

TAGAGCAGAG 660 

GCACCCTCTT 720 

ACAGCCAGCA 780 

CGGTGGCAAT 840 



285 



WO 02/086443 

ATCCAGTGCC CTGCACAAGA AGGGCAAGCT 
CGCAGGAGGG GTGG CCGTGG GTACCGCTGC 
CATCAT CGGC TTCGTCTGCG GCATCATCTC 
CCTGGAGTCC CGGCTGCACA TCCAGGACAC 
TGGCAT CAT A GGCGGCATCG TGGGTGCTGT 
TGGAAAAGAA GGGCTTGTCC ATTCCTTTGA 
AAGAACACAG GGAAAGTTCC AGATTTATGG 
GGGTGGCATC ATTGTGGGGC TCATTTTGAG 
GAACTGCTTT GAGGATGCGG TCTACTGGGA 
CCCTGAGGAC CCCACCTTCA AGCCCTCAGG 
CCCACTACCC ATGGCTTCCT CGGTACCCTT 
GCAGGCTCCA CAGACTSTCC TGGGGCCCAG 
AAGAGTGAGC AAGCAGCACC CCCACCTGCT 
CCTCCCCTTC AT CCCAGGGG GTCTGMCTGA 
ATCCAAGCCG GGTTCTGGCT GCAGAAGTTC 
AGAAAAACAG GCTCAAAGTG GGGCTGGGAC 
ACAACTTAGC TGCCAGTCAC CACCTATGAG 
AGCATCTCCT ATGCTCCCTG GGTCCCCCAG 
CAGGAATAAA CATTCTTGTT GTCCTTTGTA 



GGACATGGTG CACATCCAGA ATGCCACGCT 900 

TGAGATGATG CTCATGCCTT ACGGTGCCCT 960 

CACCCTGGGT TTTGTATACC TGACCCCATT 102 0 

ATGTGGCATT AACAATCTGC ATGGCATTCC 1080 

GACAGCGGCC TCCGCCAGCC TTGAAGTCTA 1140 

CTTTCAAGGT TTCAACGGGG ACTGGACCGC 1200 

TCTCTTGGTG ACCCTGGCCA TGGCCCTGAT 12 60 

ATTACCATTC TGGGGACAAC CTTCAGATGA 1320 

GATGCCTGAA GGGAACAGCA CTGT CTACAT 13 80 

ACCCTCAGTA CCCTCAGTAC CCATGGTGTC 1440 

GGTACCCTAG GCTCCCAGGG CAGGTGAGGA 1500 

AGGAGCTGGT GCTGACCTAG CTAGGGATGC 1560 

GGCTTGGCCT CAAGGTGCCT CCACCCCTGC 1620 

GAATGGAGAA GGAGAAGCTA CAAAGTGGGC 1680 

TGCCTCTGCC TGGGGTCTTG GCCACATTGG 1740 

CTGGTGGGTG AACCTGAGCT CTCCCAGGAG 1800 

GCTCTTCTAC CCCGTGCCTG CACCTCGGCC 1860 

ACCTCTCTGT GTTGTGTGCG TGGCAGCCTC 1920 
AAAAAAAAAA AAAAAAAA 



Seq ID NO: 2 57 Protein sequence ; 
Protein Accession #: NP 057405 



MAWNTNLRWR 
PSFQDVHVMV 
GVENLINADF 
SMTIHTFGAY 
YHGD SQHRAA 
LMPYGALIIG 
SASLEVYGKE 
WGQPSDENCF 



11 
I 

L.PLTCLLLQV 
FVGFGFLMTF 
CVASVCVAFG 
FGLTVTRILY 
INTYCSLAAC 
FVCGIISTLG 
GLVHSFDFQG 
EDAVYWEMPE 



21 



IMVILFGVFV 
LQRYGFSAVG 
AVLGKVSPIQ 
RRNLEQSKER 
VLTSVAISSA 
FVYLTPFLES 
FNGDWTARTQ 
GNSTVYIPED 



31 
I 

RYDFEADAHW 
FNFLLAAFGI 
LLIMTFFQVT 
QNSVYQSDLF 
LHKKGKLDMV 
RLHIQDTCGI 
GKFQIYGLLV 
PTFKPSGPSV 



41 

WSERTHKNLS 
QWALLMQGWF 
LFAVNEFILL 
AM I GTLFLWM 
HIQNATLAGG 
NNLHGIPGII 
TLAMALMGGI 
PSVPMVSPLP 



51 

I 

DMENEFYYRY 60 

HFLQDRYIW 120 

NLLKVKDAGG 180 

YWPSFNSAIS 240 

VAVGTAAEMM 30 0 

GGIVGAVTAA 360 

IVGLILRLPF 420 
MASSVPLVP 



Seq ID NO: 258 DNA sequence 

Nucleic Acid Accession #: NM_002358.2 

Coding sequence: 75.-692 



1 11 21 31 41 51 

I I I I I I 

GGGAAGTGCT GTTGGAGCCG CTGTGGTTGC TGTCCGCGGA GTGGAAGCGC GTGCTTTTGT 60 

TTGTGTCCCT GGCCATGGCG CTGCAGCTCT CCCGGGAGCA GGGAATCACC CTGCGCGGGA 12 0 

GCGCCGAAAT CGTGGCCGAG TTCTTCTCAT TCGGCATCAA CAGCATTTTA TATCAGCGTG 180 

GCATATATCC ATCTGAAACC TTTACTCGAG TGCAGAAATA CGGACTCACC TTGCTTGTAA 240 

CTACTGATCT TGAGCTCATA AAATACCTAA ATAATGTGGT GGAACAACTG AAAGATTGGT 300 

TATACAAGTG TT CAGTTC AG AAACTGGTTG TAGTTATCTC AAATATTGAA AGTGGTGAGG 360 

TCCTGGAAAG ATGGCAGTTT GATATTGAGT GTGACAAGAC TGCAAAAGAT GACAGTGCAC 420 

CCAGAGAAAA GTCTCAGAAA GCTATCCAGG. ATGAAATCCG TTCAGTGATC AGACAGATCA 480 

CAGCTACGGT GACATTTCTG CCACTGTTGG AAGTTTCTTG TTCATTTGAT CTGCXGATTT 540 

ATACAGACAA AGATTTGGTT GTACCTGAAA AATGGGAAGA GTCGGGACCA CAGTTTATTA 600 

CCAATTCTGA GGAAGTCCGC CTTCGTTCAT TTACTACTAC AATCCACAAA GTAAATAGCA 660 

TGGTGGCCTA CAAAATTCCT GTCAATGACT GAGGATGACA TGAGGAAAAT AATGTAATTG 720 

TAATT TTGAA ATGTGGTTTT CCTGAAATCA GGT CAT CTAT AGTTGATATG TTTTATTTCA 780 

TTGGTTAATT TTTACATGGA GAAAACCAAA ATGATACTTA CTGAACTGTG TGTAATTGTT ' 840 

CCTTTATTTT TTTGGTACCT ATTTGACTTA CCATGGAGTT AACATCATGA ATTTATTGCA 90 0 

CATTGTTCAA AAGGAACCAG GAGGTTTTTT TGTCAACATT GTGATGTATA TTCCTTTGAA 960 

GATAGTAACT GTAGATGGAA AAACTTGTGC TATAAAGCTA GATGCTTTCC TAAATCAGAT 102 0 

GTTTTGGTCA AGTAGTTTGA CTCAGTATAG GTAGGGAGAT ATTTAAGTAT AAAATACAAC 1080 

AAAGGAAGTC TAAATATTCA GAATCTTTGT TAAGGTCCTG AAAGTAACTC ATAATCTATA 1140 

AACAATGAAA TATTGCTGTA TAGCTCCTTT TGACCTTCAT TTCATGTATA GTTTTCCCTA 120 0 

TTGAATCAGT TTCCAATTAT TTGACTTTAA TTTATGTAAC TTGAACCTAT GAAGCAATGG 1260 

ATATTTGTAC TGTTTAATGT TCTGTGATAC AGAACTCTTA AAAATGTTTT TTCATGTGTT 132 0 

TT ATAAAAT C AAGTTTTAAG TGAAAGTGAG GAAATAAAGT TAAGTTTGTT TTAAAAAAAA 13 80 
AAAAAAAAAA 



Seq ID NO: 25 9 Protein sequence: 
Protein Accession #: NP_002349.1 

1 ll 21 31 41 51 

I I I I I 1 

MALQLSREQG ITLRGSAEIV AEFFSFGINS ILYQRGIYPS ETFTRVQKYG LTLLVTTDLE 60 
LIKYLNNWE QLKDWLYKCS VQKLVWISN IESGEVLERW QFDIECDKTA KDDSAPREKS 120 
QKAIQDEIRS VIRQITATVT FLPLIiEVSCS FDL.LIYTDKD LWPEKWEES GPQFITNSEE 180 
VRLRSFTTTI HKVNSMVAYK IPVND 

Seq ID NO: 2 60 DNA sequence 
Nucleic Acid Accession #: NM_001211 
Coding sequence: 43.. 3195 

1 11 21 31 41 51 

I I I I I I 

AAAGGCCTGC AGCAGGACGA GGACCTGAGC CAGGAATGCA GGATGGCGGC GGTGAAGAAG 60 

GAAGGGGGTG CTCTGAGTGA AGCCATGTCC CTGGAGGGAG ATGAATGGGA ACTGAGTAAA 120 

GAAAATGTAC AACCTTTAAG GCAAGGGCGG ATCATGT CCA CGCTTCAGGG AGCACTGGCA 180 

CAAGAAT CTG CCTGTAACAA TACTCTTCAG CAGCAGAAAC GGGCATTTGA ATATGAAATT 240 



286 



WO 02/086443 

CGATTTTACA CTGGAAATGA 
CAGAACTATC CTCAAGGTGG 
GAAGCACTAC AAGGAGAAAA 
AAATTAGGGC GTTTATGCAA 
5 ATTGGTGTTT CACTTGCTCA 

AACTTTAGGA AAGCAGATGC 
GAAAGACTAC AGTCCCAGCA 
GCACTTGAGA AAGAAGAAGA 
CTAGCTGAAC TAAAGAGCAA 
10 GGTGCTCTCA AGGCTCCAAG 
CAAAATAATA GTAGAATTAC 
TTGTCTAAGC CTACAGTCCA 
GAGCTGCAAG CAGGCCCTTG 
ACAGCTTCAC TGATAGCTGT 
15 ACTGCACAAC AGCCAGTTAT 

AGCACCAGAA AGCCTGGAAA 
CAAGCGTCTG AGGAGAAGAA 
GTAGGGGAAT TCTCCTTTGA 
CAAAGGGAAG CCGAGCTATT 
20 GAAGAGATGG AGAAGAAGCT 

CAGCAAGAAG AGACGATGCC 
CAGAAAATAC CAGGAATGAC 
GAAACTTCAC TTGCGGAGAA 
CCTTTCTCCA TTTTTGATGA 
25 GATCCCCCAC GAGTTTTAGC 

ATCACCTCAA ATGAAGATGT 
TTGAGCGAGG ATGCC AT TAT 
GACACTTGTG ACTTTGCCAG 
TCCTTGAAGG ATCTCCCTTC 
30 AAGACCTCTG AGGACCAGCA 

AAGAAGCTGA GCCCAATTAT 
GGTTCTTCTG CCTCGGTTGC 
CTAGAACTTA CTAATGAGAC 
CGCAGACAGC TACTGAAGTC 
35 GACAGACCAA TGCCTAAGTT 

TGCATTAAAC GAGAATACCT 
AACTCTGCAG AATTAACAGT 
ATCAACCTCA AGTTAAAGGA 
CAATATCAAG ATGGCTGTAT 
40 CTTCTCCAAC ACAGTGAATA 

TTGACAATAG TGGAGATGCT 
TGTCTGATTC TCAGAAACAG 
TTGAAGATAG TGGACTTTTC 
CTCAGCGGCT TTCGGACTGT 
TCTCCCTACC AGGTAGACCT 
GAACACCTAC AGGTCTTCTG 
CTAAAAGATG GTGAATTGTG 
GCCACAGTGT CTGTTCTTGG 
TTCCAAAGTC ACCTGAACAA 
50 TTGCTCTTTC AGTGAGCTAG 

GTATTGTGGA ACACTGAAAC 
CTACCATTGC TGTTCTACTT 
ACAGTGATAT ACTTACTCAT 
CAGACTCATT ACAAATGGTT 
55 CTTTTCCCAT TTGTAATTTG 

TAAAATAGTA TCTGTTAAAA 



PCT/US02/12476 



45 



CCCTCTGGAT 
GAAAGAGAGT 
ACGATATTAT 
TGAGCCTTTG 
GTTCTATATC 
GATATTTCAG 
CCGACAATTC 
GGAGGAAGTT 
AGGGAAAAAG 
CCAGAACAGA 
TGTTTTTGAT 
GCCATGGATA 
GAACACAGGC 
ACCCGCTGTG 
GACACCATGT 
GGAAGAAGGA 
AGAGAAGATG 
AGAAATTCGG 
GACCAGTGCA 
AAAAGAAATC 
TACAAAGGAG 
TCTATCCAGT 
CATTTGGCAG 
GTTTCTTCTT 
TCAACGAAGA 
GTCTCCAGAT 
CACAGGCTTC 
AGCAGCTCGT 
TGATCCTGAG 
GACAGCTTGT 
TGAAGACAGT 
AAGCACCTCC 
TTCAGAAAAC 
CCTACCAGAG 
GGAAATTGAG 
AATATGTGAA 
AATAAAGGTA 
ACGTTTAAAT 
TGTTTGGCAC 
TATTACCCAT 
ACACAAAGCA 
AATCCACGAT 
CTACAGTGTT 
ACAGATCCTG 
GTTTGGTATA 
GGATGGGTCC 
GAATAAATTC 
GGAGCTTGCA 
AGCCTTATGG 
GCAAT CAAGT 
TGTATGTGCT 
TTTGGTACAG 
GGCCTTGTCT 
ACCTTGTTAT 
TAAAATGTTC 
AAAAAAAAAA 



GTTTGGGATA 
AATATGTGAA 
AGTGATCCTC 
GATATGTACA 
TCATGGGCAG 
GAAGGGATTC 
CAAGCTCGAG 
TTTGAGTCTT 
ACAGCAAGAG 
GGACTCCAAA 
GAAAATGCTG 
GCACCCCCCA 
AGGTCCTTGG 
CTTCCCAGTT 
AAAATTGAAC 
GATCCT CTAC 
ATGTATTGTA 
GCTGAAGTTT 
GAGAAGAGAG 
CAAACTACTC 
ACAACTAAAC 
TCTGTTTGTC 
GAACAACCTC 
TCAGAAAAGA 
CCCCTTGCAG 
GTTTGTGATG 
AGAAATGTAA 
TTTGTATCCA 
AGACTGTTAC 
GGCACTATCT 
CGTGAAGCCA 
TCCATCAAAT 
CCTACTCAGT 
TTAAGTGCCT 
AAGGAAATTG 
GATTACAAGT 
TCTTCTCAAC 
GAAGATTTTG 
CAATATATAA 
GAAATAACAG 
GAAATAGTCC 
CCCTATGATT 
GACCTTAGGG 
GAAGGACAAA 
GCAGATTTAG 
TTCTGGAAAC 
TTTGTGCGGA 
G CAGAAATGA 
AAGGTAGGGA 
CTCACAGATT 
GTAATTTAAT 
GTATATTTTG 
AACTTTTGTG 
TTAACCCATT 
TCTTATGATC 
AAAAAAAAAA 



GGTATAT CAG 
CGTTATTAGA 
GATTTCTCAA 
GTTACTTGCA 
AAGAATATGA 
AACAGAAGGC 
TGTCTCGGCA 
CTGTACCACA 
CTCCAATCAT 
ATCCATTTCC 
ATGAGGCTTC 
TGCCCAGGGC 
AACACAGGCC 
TCACTCCATA 
CTAGTATAAA 
AAAGGGTTCA 
AGGAGAAGAT 
TCCGGAAGAA 
CAGAAATGCA 
AGCAAGAAAG 
TGCAAATTGC 
AAGTAAACTG 
ATTCTAAAGG 
AGAATAAAAG 
TTCTCAAAAC 
AATTTACAGG 
CAATTTGTCC 
CTCCTTTTCA 
CGGAAGAAGA 
ACAGTCAGAC 
CACACTCCTC 
GTCTTCAAAT 
CACCATGGTG 
CTGCAGAGTT 
AATTAGGTAA 
TATTCTGGGT 
CTGTCCCATG 
ATCATTTTTG 
ACTGCTTCAC 
TGTTGATTAT 
ATGGTGACTT 
GTAACAAGAA 
TGCAGCTGGA 
AGATCCTGGC 
CACATTTACT 
TTAGCCAAAA 
TTCTGAATGC 
ATGGGGTTTT 
AGTTAACTAG 
GCTGCCTCAG 
TTAGGACACA 
ACGTCACTGA 
AAGAACTATT 
TGTCTCTACT 
ACCATGTATT 
AAA 



CTGGACAGAG 3 0 0 
AAGAGCTGTA 360 
TCTCTGGCTT 420 
CAACCAAGGG 480 
AGCTAGAGAA 540 
TGAACCACTA 600 
AACTCTGTTG 660 
ACGAAGCACA 720 
CCGTGTAGGA 780 
TCAACAGATG 840 
TACAGCAGAG 900 
CAAAGAGAAT 960 

TCGTGGCAAT 1020 

TGTGGAAGAG 1080 

CCACATCCTA 1140 

GAGCCAT CAG 1200 

TTATGCAGGA 1260 

ATTAAAAG AG 132 0 

GAAACAGATT 13 80 

AACAGGTGAT 1440 

TTCCGAGTCT 1500 

TTGTGCCAGA 15 60 

TCCCAGTGTA 1620 

TCCTCCTGCA 1680 

CTCAGAAAGC 1740 

AATTGAACCC 18 00 

TAACCCAGAA 18 6 0 

TGAGATAATG 1920 

TCTAGATGTA 1980 

TCTCAGCATC 2 04 0 

TGGCTTCTCT 2100 

TCCTGAGAAA 2160 

TT CACAGT AT 222 0 

GTGTATAGAA 2280 

TGAGGATTAC 2340 

GGCGCCAAGA 2400 

GGACTTTTAT 2 460 

CAGCTGTTAT 252 0 

CCTTCAGGAT 2580 

TTATAACCTT 2640 

GAGTCCAAGG 27 00 

CAATCAAGCT 2760 

TGTTTTTACC 2820 

TAACTGTTCT 2 880 

ATTGTTCAAG 2940 

TATTTCTGAG 3 000 

CAATGATGAG 3 060 

TGACACTACA 3120 

TCCTGGGGCT 3180 

AGCAATGGTT 3240 

TTTAGATGCA 3 3 00 

TATTTTTTAT 3 3 60 

TTATTCTAAA 3420 

TTTCCCTGTA 34 80 

TTGTAAATAA 3540 



60 



Seq ID NO: 261 Protein sequence: 
Protein Accession #: NP_001202 



65 



70 



75 



80 



MAAVKKEGGA 
AFEYEIRFYT 
FLNLWLKLGR 
QKAEPLERLQ 
PIIRVGGALK 
PRAKENELQA 
SINHILSTRK 
RKKLKEQREA 
QIASESQKIP 
NKSPPADPPR 
ICPNPEDTCD 
SQTLSIKKLS 
PWCSQYRRQL 
FWVAPRNSAE 
CFTLQDLLQH 
NKNNQALKIV 
HLLLFKEHLQ 
GVFDTTFQSH 



11 
I 

LSEAMSLEGD 
GNDPLDVWDR 
LCNEPLDMYS 
SQHRQFQARV 
APSQNRGLQN 
GPWNTGRSLE 
PGKEEGDPLQ 
ELLTSAEKRA 
GMTLSSSVCQ 
VLAQRRPIiAV 
FARAARFVST 
PIIEDSREAT 
LKSLPELSAS 
LTVIKVSSQP 
SEYITHEITV 
DFSYSVDLRV 
VFWDGSFWKL 
LNKALWKVGK 



21 
I 

EWELSKENVQ 
YISWTEQNYP 
YLHNQGIGVS 
SRQTLLALEK 
PFPQQMQNNS 
HRPRGNTASL 
RVQSHQQASE 
EMQKQIEEME 
VNCCARETSIi 
LKTSESITSN 
PFHEIMSLKD 
HSSGFSGSSA 
AELC I EDRPM 
VPWDFYINLK 
LIIYNLLTIV 
QLDVFTLSGF 
SQNISELKDG 
LTSPGALLFQ 



31 

I 

PLRQGRIMST 
QGGKESNMST 
LAQFYISWAE 
EEEEEVFESS 
RITVFDENAD 
IAVPAVIiPSF 
EKKEKMMYCK 
KKLKEIQTTQ 
AENIWQEQPH 
EDVSPDVCDE 
LPSDPERLIjP 
SVASTSSIKC 
PKLEIEKEIE 
LKERLNEDFD 
EMLHKAEIVH 
RTVQILEGQK 
ELWNKFFVRI 



41 

I 

LQGALAQESA 
LLERAVEALQ 
EYEARENFRK 
VPQRSTLAEIj 
EASTAELSKP 
TPYVEETAQQ 
EKIYAGVGEF 
QERTGDQQEE 
SKGPSVPFSI 
FTGIEPLSED 
EEDLDVKTSE 
LQIPEKLELT 
LGNEDYCIKR 
HFCSCYQYQD 
GDLSPRCLIL 
ILANCSSPYQ 
LNANDEATVS 



51 

I 

CNNTLQQQKR 60 

GEKRYYSDPR 12 0 

ADAIFQEGIQ 180 

KSKGKKTARA 240 

TVQPWIAPPM 3 00 

PVMTPCKIEP 3 60 

SFEEIRAEVF 420 

TMPTKETTKL 480 

FDEFLIiSEKK 540 

AIITGFRNVT 600 

DQQTACGTIY 660 

NETSENPTQS 72 0 

EYLICEDYKL 780 

GCIVWHQYIN 840 

RNRIHDPYDC 900 

VDLFGIADLA 960 

VLGELAAEMN 1020 



85 



Seq ID NO: 2 62 DNA sequence 
Nucleic Acid Accession #: NM_003784 
Coding sequence: 365.. 1507 



11 



21 



31 



41 



51 



j 



287 



10 



15 



20 



25 



30 



35 



40 



WO 02/086443 

I I 

GTCTACTTAT CAATAAGCAG 
TAAAACTGAA TTCTCAGAAT 
ATTAGGTAGT GGTAAAACAG 
TGTACAGGGA AGCTCTCCTT 
CAACAGT CTT GAGAAGT GTG 
AAGGAAACCA GATTCCCATC 
TGCAATGGCC TCCCTTGCTG 
GGATGACAAT CAAGGAAATG 
GGCCCTGGTC CGCTTGGGCG 
TGTTAACACT GCCTCAGGAT 
ACTGAAAAGA GTTTTTTCTG 
GAATGGGCTT TTTGCTGAAA 
AAAATTATAC GATGCCAAAG 
ACGTAATATT AATAAGTGGG 
TGAAGGTGGC ATAAGCTCAT 
CAAGTGGCAA TCAGCCTTCA 
GTGCTCTGGG AAGGCAGTCG 
TGAGGACCCA TCAATGAAGA 
TCTGCTGCCT GAGAATGACC 
GGAATGGACC AATCCAAGGC 
CAAGATAGAG AAGAATTATG 
CTTTGATGAA T CCAAAG C AG 
AAGGATGATG CACAAATCTT 
CACAGGAAGT AATATTGTAG 
CCCATTCCTA TTTGTTATCA 
CCCTTGAAAA TCCAATTGGT 
AAGTCAATAG ATYTGRGTTT 
CTAACATTGG TCAGCAGATG 
TCCTGATCCC TGCTCTTAGC 
TCTTTCTTCC CACGCTCATT 
RGTGCTCAAC TGGTAAGGAG 
AGTTATCGCA GATATTCTAG 
CTAGAAATAA GTGTGAAGGA 
CTTCATATGT TTGATTTTAA 
ATTAGGGACC TACCAAAATA 
TGATAAGACA AT AT GTACAT 
GTTATCTACA GAATCATATT 
AGAATAAAGA AATACAACAT 



PCT/US02/12476 



CTGCCTGTGC 
TTTAGAACAA 
GCTCCCTTCG 
CATCACCTTC 
GAAACATTTT 
ACTGCTTCTG 
CAGCAAATGC 
GAAATGTGTT 
CTCAAGATGA 
ATGGAAACTC 
ATATAAATGC 
AAGTGTATGG 
TGGAGCGAGT 
TTGAAAATGA 
CTGCTGTAAT 
CCAAGAGCGA 
CCATGATGCA 
TTCTTGAGCT 
TCTCTGAAAT 
GAATGACCTC 
AAATGAAACA 
ATCTCTCTGG 
ACATAGAGGT 
AAAAGCAACT 
GGAAGGATGA 
TTCTGTTATA 
AATTGGAAAA 
ACACTGGTGA 
ATTCTACCAC 
TCTATCATTC 
AACGTAGAAG 
CTTCATTGTA 
TAAATTTTCT 
AT CAGTGTAT 
TTTCATTAAT 
GTTTTTTCAA 
TCATATGCTG 
ACCTGTAAA 



AGAGTGCAGG 
ATTTTTGTCT 
AAGCTCTCCT 
CTAAGTGCAT 
CTTTGTGAGT 
GGTATCAGAT 
AGAGTTTTGC 
CTTTTCCTCT 
CTCCCTCTCT 
TTCTAATAGT 
ATCCCACAAG 
CTTT CATAAG 
TGACTTTACG 
AACACATGGC 
GGTGCTGGTG 
AACCATAAAT 
TCAGGAACGG 
CAGATACAAT 
TGAAAACAAA 
TAAGTATGTT 
ATATTTGAGA 
GATTGCTTCG 
CACTGAGGAG 
CCCTCAGTCC 
CATCATCTTA 
GCAGTCCCCA 
ATGTGGTGTT 
CTTGACCCTT 
CATGTGTCTC 
TCCCCCATGA 
TAGCCCTAGG 
AGCAAT CTAG 
TTGTTGACCT 
AATCTAGATG 
GCTTTCAATT 
ATATTAAAGA 
TGTAGTTTAT 



CTGCACCTTT 
AGAAATGCTG 
TCATCACCTT 
GGGGGAAAAT 
GAGAACAGAT 
GCTAGCGCTG 
TTCAACCTGT 
CTGAGCCTCT 
CAGATTGATA 
CAGTCAGGGC 
GATTATGATC 
GACTACATTG 
AATCATTTAG 
AAAATCAAGA 
AATGCTGTGT 
TGCCATTTCA 
AAGTTCAATT 
GGTGGCATAA 
CTGACCTTTC 
GAGGTATTTT 
GCCCTAGGGC 
GGGGGTCGTC 
GGCACCGAGG 
ACGCTGTTTA 
TTCAGTGGCA 
CAACATCAAA 
TCCTTTGAGT 
CCTAGACACC 
ACCCATTTCT 
CCCGTCTGGA 
GATCCTTTTT 
GAAATAAGCC 
ATGAAGATTT 
GTAAAAAATG 
GACAAATTTT 
TCTTTTAACT 
AAGTTTTTCC 



GGACAGCCTT 60 

ACTTTGGTTC 120 

CCTAAGTGCA 180 

ACCTAGGGCT 240 

CACCTAGAGA 300 

CACTCCATTT 3 60 

TCAGAGAGAT 420 

TCGCTGCCCT 480 

AGTTGCTTCA 540 

TCCAGTCTCA 600 

TCAGCATTGT 660 

AGTGTGCCGA 720 

AAGACACTAG 780 

ACGTGATTGG 840 

ACTTCAAAGG 900 

AATCTCCCAA 960 

TGTCTGTTAT 1020 

ACATGTACGT 1080 

AGAATCTAAT 1140 

TTCCTCAGTT 1200 

TGAAAGATAT 12 60 

TGTATATATC 1320 

CTACTGCTGC 13 80 

GAGCTGACCA 1440 

AAGTTTCTTG 1500 

GRACCACCAC 1560 

TTATTTCTTC 1620 

TGGTTGATTG 1680 

AATTTCATTG 1740 

AATTATGGAG 1800 

GAAACTCTAC 1860 

CTGCTGCTTT 192 0 

TAGAGTTTAC 1980 

TGAAATTGGG 2040 

GGCCTTTCTT 210 0 

GTTGGCAGTT 2160 

TCTATTTATC 2220 



Seq ID NO: 2 63 Protein sequence: 
Protein Accession #: NP 003775 



45 



50 



55 



60 



65 



70 



75 



80 



MASLAAANAE 
NTASGYGNSS 
LYDAKVERVD 
WQSAFTKSET 
LPENDLSEIE 
DESKADLSGI 
FLFVIRKDDI 



11 

I 

FCFNLFREMD 
NSQSGLQSQL 
FTNHLEDTRR 
INCHFKSPKC 
NKLTFQNLME 
ASGGRLYISR 
ILFSGKVSCP 



21 



DNQGNGNVFF 
KRVFSDINAS 
NINKWVENET 
SGKAVAMMHQ 
WTNPRRMTSK 
MMHKSYIEVT 



31 
I 

SSLSLFAALA 
HKDYDLS I VN 
HGKIKNVIGE 
ERKFNLSVIE 
YVEVFFPQFK 
EEGTEATAAT 



41 



51 



JjVRLGAQDDS 
GLFAEKVYGF 
GGISSSAVMV 
DPSMKILELR 
I EKNYEMKQY 
GSNIVEKQLP 



LSQIDKLLHV 
HKDYIECAEK 
LVNAVYFKGK 
YNGGINMYVL 
LRALGLKDIF 
QSTLFRADHP 



Seq ID NO: 2 64 DNA sequence 
Nucleic Acid Accession #: AB052906 
Coding sequence: 74-814 



1 11 21 31 41 51

I I I I I I

AAAACCTTGA GGTGATTCAT CTTCCAGGCT CTCCTTCCAT CAAGTCTCTC CTCCCTAGCG
CTCTGGGTCC TTAATGGCAG CAGCCGCCGC TACCAAGATC CTTCTGTGCC TCCCGCTTCT
GCTCCTGCTG TCCGGCTGGT CCCGGGCTGG GCGAGCCGAC CCTCACTCTC TTTGCTATGA
CATCACCGTC ATCCCTAAGT TCAGACCTGG ACCACGGTGG TGTGCGGTTC AAGGCCAGGT
GGATGAAAAG ACTTTTCTTC ACTATGACTG TGGCAACAAG ACAGTCACAC CTGTCAGTCC
CCTGGGGAAG AAACTAAATG TCACAACGGC CTGGAAAGCA CAGAACCCAG TACTGAGAGA
GGTGGTGGAC ATACTTACAG AGCAACTGCG TGACATTCAG CTGGAGAATT ACACACCCAA
GGAACCCCTC ACCCTGCAGG CCAGGATGTC TTGTGAGCAG AAAGCTGAAG GACACAGCAG
TGGATCTTGG CAGTTCAGTT TCGATGGGCA GATCTTCCTC CTCTTTGACT CAGAGAAGAG
AATGTGGACA ACGGTTCATC CTGGAGCCAG AAAGATGAAA GAAAAGTGGG AGAATGACAA
GGTTGTGGCC ATGTCCTTCC ATTACTTCTC AATGGGAGAC TGTATAGGAT GGCTTGAGGA
CTTCTTGATG GGCATGGACA GCACCCTGGA GCCAAGTGCA GGAGCACCAC TCGCCATGTC
CTCAGGCACA ACCCAACTCA GGGCCACAGC CACCACCCTC ATCCTTTGCT GCCTCCTCAT
CATCCTCCCC TGCTTCATCC TCCCTGGCAT CTGAGGAGAG TCCTTTAGAG TGACAGGTTA
AAGCTGATAC CAAAAGGCTC CTGTGAGCAC GGTCTTGATC AAACTCGCCC TTCTGTCTGG
CCAGCTGCCC ACGACCTACG GTGTATGTCC AGTGGCCTCC AGCAGATCAT GATGACATCA
TGGACCCAAT AGCTCATTCA CTGCCTTGAT TCCTTTTGCC AACAATTTTA CCAGCAGTTA
TACCTAACAT ATTATGCAAT TTTCTCTTGG TGCTACCTGA TGGAATTCCT GCACTTAAAG
TTCTGGCTGA CTAAACAAGA TATATCATTT TCTTTCTTCT CTTTTTGTTT GGAAAATCAA
GTACTTCTTT GAATGATGAT CTCTTTCTTG CAAATGATAT TGTCAGTAAA ATAATCACGT
TAGACTTCAG ACCTCTGGGG ATTCTTTCCG TGTCCTGAAA GAGAATTTTT AAATTATTTA
ATAAGAAAAA ATTTATATTA ATGATTGTTT CCTTTAGTAA TTTATTGTTC TGTACTGATA
TTTAAATAAA GAGTTCTATT TCCCAAAAAA AAAAAAAAAA A



60 
120 
180 
240 
300 
360 



1 60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
72 0 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 



85 



Seq ID NO: 265 Protein sequence: 
Protein Accession #: BAB61048.1 



288 



WO 02/086443 

1 11 21 31 41 51 

I I I I I I 

MAAAAATKIL LCLPLLDLLS GWSRAGRADP HSLCYDITVI PKFRPGPRWC AVQGQVDEKT 
FLHYDCGNKT VTPVSPLGKK LNVTTAWKAQ NPVLREVVDI LTEQLRDIQL ENYTPKEPLT
LQARMSCEQK AEGHSSGSWQ FSFDGQIFLL FDSEKRMWTT VHPGARKMKE KWENDKVVAM
SFHYFSMGDC IGWLEDFLMG MDSTLEPSAG APLAMSSGTT QLRATATTLI LCCLLIILPC
FILPGI 

Seq ID NO: 266 DNA sequence

Nucleic Acid Accession #: XM_084853.1 

Coding sequence: 127-444 

1 11 21 31 41 51 

I I I I I I 

ATTGATGATA TATTTAACGA AATCAAATTT GGTGAATATG TGGACACTGG AAAGCTAATC 
GACAAGATCA ACTTACCAGA TTTCCTAAAA GTGTACCTTA ACCACAAGCC ACCTTTTGGT 
AACACCATGA GTGGCATCCA CAAGAGCTTT GAGGTGCTCG GTTATACCAA CTCCAAAGGG 
AAAAAGGCCA TTCGAAGAGA GGACTTCCTG AGACTGCTCG TTACTAAAGG TGAGCATATG
ACGGAGGAGG AGATGTTGGA TTGCTTTGCT TCACTGTTTG GCCTGAATCC CGAGGGATGG
AAATCCGAGC CTGCAACCTG CTCCGTCAAA GGTTCAGAAA TTTGCCTTGA AGAAGAACTT
CCAGACGAAA TCACTGCAGA AATATTCGCG ACTGAAATTC TTGGCTTAAC CATTTCAGAA
GATTCCGGCC AGGATGGTCA GTGAAGTTAC CAGGAATGTT TAAAGCACAA AGGACTTTGG
GTGTGTGTGC ATGCACATGT GTGTGTTTTC CATGAGGCAC TGCTTTTTAT GCATTTCCCT
CCCCCCTCTC ATCTTTAGAA CATTTAGACA TTAAAGCAAG TTTCTGGTGA GCAATG



Seq ID NO: 267 Protein sequence: 
Protein Accession #: XP_084853.1 

1 11 21 31 41 51 

I I I I I I 

MSGIHKSFEV LGYTNSKGKK AIRREDFLRL LVTKGEHMTE EEMLDCFASL FGLNPEGWKS 

EPATCSVKGS EICLEEELPD EITAEIFATE ILGLTISEDS GQDGQ 

Seq ID NO: 268 DNA sequence 
Nucleic Acid Accession #: NM_001898
Coding sequence: 57-482

1 11 21 31 41 51 

I I I I I I 

GGCTCTCACC CTCCTCTCCT GCAGCTCCAG CTTTGTGCTC TGCCTCTGAG GAGACCATGG 
CCCAGTATCT GAGTACCCTG CTGCTCCTGC TGGCCACCCT AGCTGTGGCC CTGGCCTGGA 
GCCCCAAGGA GGAGGATAGG ATAATCCCGG GTGGCATCTA TAACGCAGAC CTCAATGATG
AGTGGGTACA GCGTGCCCTT CACTTCGCCA TCAGCGAGTA TAACAAGGCC ACCAAAGATG 
ACTACTACAG ACGTCCGCTG CGGGTACTAA GAGCCAGGCA ACAGACCGTT GGGGGGGTGA 
ATTACTTCTT CGACGTAGAG GTGGGCCGCA CCATATGTAC CAAGTCCCAG CCCAACTTGG 
ACACCTGTGC CTTCCATGAA CAGCCAGAAC TGCAGAAGAA ACAGTTGTGC TCTTTCGAGA 
TCTACGAAGT TCCCTGGGAG AACAGAAGGT CCCTGGTGAA ATCCAGGTGT CAAGAATCCT 
AGGGATCTGT GCCAGGCCAT TCGCACCAGC CACCACCCAC TCCCACCCCC TGTAGTGCTC 
CCACCCCTGG ACTGGTGGCC CCCACCCTGC GGGAGGCCTC CCCATGTGCC TGCGCCAAGA 
GACAGACAGA GAAGGCTGCA GGAGTCCTTT GTTGCTCAGC AGGGCGCTCT GCCCTCCCTC 
CTTCCTTCTT GCTTCTAATA GCCCTGGTAC ATGGTACACA CCCCCCCACC TCCTGCAATT 
AAACAGTAGC ATCGCC 

Seq ID NO: 269 Protein sequence: 
Protein Accession #: NP_001889.1

1 11 21 31 41 51 

I I I I I I

MAQYLSTLLL LLATLAVALA WSPKEEDRII PGGIYNADLN DEWVQRALHF AISEYNKATK 
DDYYRRPLRV LRARQQTVGG VNYFFDVEVG RTICTKSQPN LDTCAFHEQP ELQKKQLCSF 
EIYEVPWENR RSLVKSRCQE S 

Seq ID NO: 270 DNA sequence 
Nucleic Acid Accession #: XM_093210
Coding sequence: 13-1854 

1 11 21 31 41 51 

I I I I I I 

ATGGCAAGCG CCGGAATCTC CTCAGCTGCC GTTTCACAAA AGAGGTACCA GGTCCGCACC 

AAACGAGCAC ACAAGCAGCA CCAGGAGCTG CAGAAGAAGG AGGCGGCAGC GATGGACCAG 

GGCAGAGGGA ATGGGGAGGG GGCATCCTAC CCCATATCTG AGGTGCGACT GCGGGACGTA 

GAGCGGACTG GGCCTTTCCC GTTGGCGCGT GGCCTCAATC AGGACTTCTT GCCCACGTGC 

GCCTTCAAAA CGGTAAGAGC TGCAACTGAA CGTGTGAGAC ATGGTGCAGA TAGGCTGAGA 

GGCGGCGGGA GAGATGCCCA TGAACTCAAG TACCCGGACA CGCCCTCCAC TTCTACCACC 

ACGAGTAACA CCGCCCCCAC GGGACCGCTC TCGAGGTCCC CCAAGCCAAG GACGCAAGGA 

GGAACGCCCC GGCGCGCGGC CAGCAGCGGC GGGCACCGGC CCAATGGCCA CGGAACTCAG 

CACTGGCAGT CGGCCCTCCT CACACCGCAG GCGTGCAGTG TGGCCGACGG AGCCTCCCGG 

GCCGAGGACC CAGCTAGGCC GTCACCCCGG TTGCTCCCAC GGGAAGGGGC ACCAGGCAAA 

CTGCCCAAGG CCCCGAGCCC AGGCTCCCTG GCGGAGGCCT CCGCTGGTCC CGCCCAGATC 

ATGGCCGCCA CCAGGCTCCC GAGCCATGGC TTCCTGTCCG GGAACGGCCC GGCGTCCTGG 

CTGTCCAGCT AG 

Seq ID NO: 271 Protein sequence: 
Protein Accession #: XP_093210 

1 11 21 31 41 51 



289 



WO 02/086443 

I I I I I I

MLRHGEQKRK RARKKWDFLP TCAFKTVRAA TERVRHGADR LRGGGRDAHE LKYPDTPSTS 
TTTSNTAPTG PLSRSPKPRT QGGTPRRRPA AAGTRANGHG TQHWQSALLT PQACSVADGA
SRAEDPARPS PRLLPREGAP GKLPKAPSPG SLAEASAGLL AHVRLQNADA QRVSISQALP 
PNSSVGRKEE RPGAGQQRRA PAPMATELST GSRPSSHRRR AVWPTEPPGP RTQLEPSPRL 
LPREGAPGKL PKAPSPGSLA EASAGPAQIM AATRLPSRGF LSGNGPASWL SS 

Seq ID NO: 272 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..732 

1 11 21 31 41 51 

I I I I I I

GGATACTGTG TCACTCAAAG TAATGGGAGG GAGAGAGAAC AGGGAGGGTA GGGATGCTTT 

TGAAAAAGCT TTTTTTCCCA CTTTTAACTT GCTTTAGCGT TAAGAGTACT TACCAGCTAA 

TAATGTGGAG GAAATTATTC TTTCTCATTG GAGATTACAG AATATATCTA TTCATCTTGA 

ATACCCACTT GAAGCCTCTG TAGAAATGTC TCGTCCTCCG GTTGTATTTC TAAAACCTAC 

ATGATTTTGT CTTGTTTCTG CAGTGAGAAA TTACATCCAT AGCAAAGACA AAAGTCTTTT 

TAAATTATTT TTATTTATCT TTCATATAGT TCTTACAATT TCTAAAAAAT TAACACTCAT 

TTAGTATCAC AATTTATGGG AGAGGGTTTT TTGTATTTTT AAGCATATGT GGCTTATATA

AAAATTGCAG AAGTCATAGG ACTGTCATGT ATTGCAGCTC TGAGAACCAA TGCCTGAAAC
TTAAGCC 



Seq ID NO: 273 Protein sequence: 
Protein Accession #: Eos sequence 

1 11 21 31 41 51 

I I I I I I

MGGRENREGR DAFEKAFFPT FNLL 

Seq ID NO: 274 DNA sequence 

Nucleic Acid Accession #: NM_003976.2

Coding sequence: 299-961

1 11 21 31 41 51 

I I I I I I 

CTCTGAGCTT CTCTGAGCCT TGTTTGCTCA TCTGGAAAAA GGGGATTAAA CCATTTACCT 

CATGGAGTTG TGAAAGAATA GCTGCAAAGC ACCTAACACA TAGTAAGGTT CCCAGTGCAG 

CTACTTCTGC TGGGTTGAGT CTAGCTGTGT AGGCCCCTTG TTCCTCACCT GGAGAAACTG 

GGGTGGCAGG CCGGTCCCCC ACAAAAGATA ACTCATCTCT TAATTTGCAA GCTGCCTCAA 

CAGGAGGGTG GGGGAACAGC TCAACAATGG CTGATGGGCG CTCCTGGTGT TGATAGAGAT

GGAACTTGGA CTTGGAGGCC TCTCCACGCT GTCCCACTGC CCCTGGCCTA GGCGGCAGCC 

TGCCCTGTGG CCCACCCTGG CCGCTCTGGC TCTGCTGAGC AGCGTCGCAG AGGCCTCCCT 

GGGCTCCGCG CCCCGCAGCC CTGCCCCCCG CGAAGGCCCC CCGCCTGTCC TGGCGTCCCC 

CGCCGGCCAC CTGCCGGGGG GACGCACGGC CCGCTGGTGC AGTGGAAGAG CCCGGCGGCC 

GCCGCCGCAG CCTTCTCGGC CCGCGCCCCC GCCGCCTGCA CCCCCATCTG CTCTTCCCCG 

CGGGGGCCGC GCGGCGCGGG CTGGGGGCCC GGGCAGCCGC GCTCGGGCAG CGGGGGCGCG 

GGGCTGCCGC CTGCGCTCGC AGCTGGTGCC GGTGCGCGCG CTCGGCCTGG GCCACCGCTC 

CGACGAGCTG GTGCGTTTCC GCTTCTGCAG CGGCTCCTGC CGCCGCGCGC GCTCTCCACA 

CGACCTCAGC CTGGCCAGCC TACTGGGCGC CGGGGCCCTG CGACCGCCCC CGGGCTCCCG 

GCCCGTCAGC CAGCCCTGCT GCCGACCCAC GCGCTACGAA GCGGTCTCCT TCATGGACGT 

CAACAGCACC TGGAGAACCG TGGACCGCCT CTCCGCCACC GCCTGCGGCT GCCTGGGCTG 

AGGGCTCGCT CCAGGGCTTT GCAGACTGGA CCCTTACCGG TGGCTCTTCC TGCCTGGGAC 

CCTCCCGCAG AGTCCCACTA GCCAGCGGCC TCAGCCAGGG ACGAAGGCCT CAAAGCTGAG 

AGGCCCCTAC CGGTGGGTGA TGGATATCAT CCCCGAACAG GTGAAGGGAC AACTGACTAG 

CAGCCCCAGA GCCCTCACCC TGCGGATCCC AGCCTAAAAG ACACCAGAGA CCTCAGCTAT 

GGAGCCCTTC GGACCCACTT CTCACAGACT CTGGCACTGG CCAGGCCTCG AACCTGGGAC 

CCCTCCTCTG ATGAACACTA CAGTGGCTGA GGCATCAGCC CCCGCCCAGG CCCTGTAGGG 

ACAGCATTTG AAGGACACAT ATTGCAGTTG CTTGGTTGAA AGTGCCTGTG CTGGAACTGG 

CCTGTACTCA CTCATGGGAG CTGGCCCC 

Seq ID NO: 275 Protein sequence: 
Protein Accession #: NP_003967.1

1 11 21 31 41 51 

I I I I I I 

MELGLGGLST LSHCPWPRRQ PALWPTLAAL ALLSSVAEAS LGSAPRSPAP REGPPPVLAS 

PAGHLPGGRT ARWCSGRARR PPPQPSRPAP PPPAPPSALP RGGRAARAGG PGSRARAAGA 

RGCRLRSQLV PVRALGLGHR SDELVRFRFC SGSCRRARSP HDLSLASLLG AGALRPPPGS 

RPVSQPCCRP TRYEAVSFMD VNSTWRTVDR LSATACGCLG

Seq ID NO: 276 DNA sequence 

Nucleic Acid Accession #: NM_057091.1 

Coding sequence: 783-1445 

1 11 21 31 41 51 

I I I I I I 

ACTGGCCGCT GAGAGAAGAA TCGGGTGGAG CAGAGAGCAG CTGCTGCAGG GCAGACAGCC 

GGACCCCCAA ATCTGCACGT ACCAGCAGTC AGCCGCCCCA CGCAGGGACC GGCTTACCCC 

TCGCTCCCCG CCCTCACTCA CTTTCTCCCG CCCTCGGCCC GGCCTCCCAG CTCTCTACTT 

CGCGTGTCTA CAAACTCAAC TCCCGGTTTC CGTGCCTCTC CACCGCTCGA GTTCTCTACT 

CTCCATATCC GAGGGGCCCC TCCCAGCATC TACCCCCCTC CCAACCTCGG GGGACCTAGC 

CAAGCTAGGG GGGACTGGAT CCGACGGGTG GAGCAGCCAG GTGAGCCCCG AAAGGTGGGG 

CGGGGCAGGG GCGCTCCCAG CCCCACCCCG GGATCTGGTG ACGCTGGGGC TGGAATTTGA 

CACCGGACGG CTGCGGCGGC GGGCAGGAGG CTGCTGAGGG ATGGAGTTGG GCCCGGCCCC 

CAGACAAGGC CCGGGGGCTC CGCCAGCAGC AGGTCCCTCG GGCCCCAGCC CTCGCTGCCA 



290 



WO 02/086443 

CCCGGGCCTG GAGCCCCACA CCCGAGGGTG CAGACTGGCT GCCAAGGCCA CACTTTTGGC 
TAAAAGAGGC ACTGCCAGGT GTACAGTCCT GGGCATGCGC TGTTTGAGCT TCGGGGGAGA 
GCCCAGCACT GGTCCCCGGA AAGGTGCCTA GAAGAACAAG GTGCAGGACC CCGTGCTGCC 
TCAACAGGAG GGTGGGGGAA CAGCTCAACA ATGGCTGATG GGCGCTCCTG GTGTTGATAG 
AGATGGAACT TGGACTTGGA GGCCTCTCCA CGCTGTCCCA CTGCCCCTGG CCTAGGCGGC 
AGCCTGCCCT GTGGCCCACC CTGGCCGCTC TGGCTCTGCT GAGCAGCGTC GCAGAGGCCT 
CCCTGGGCTC CGCGCCCCGC AGCCCTGCCC CCCGCGAAGG CCCCCCGCCT GTCCTGGCGT 
CCCCCGCCGG CCACCTGCCG GGGGGACGCA CGGCCCGCTG GTGCAGTGGA AGAGCCCGGC 
GGCCGCCGCC GCAGCCTTCT CGGCCCGCGC CCCCGCCGCC TGCACCCCCA TCTGCTCTTC 
CCCGCGGGGG CCGCGCGGCG CGGGCTGGGG GCCCGGGCAG CCGCGCTCGG GCAGCGGGGG 
CGCGGGGCTG CCGCCTGCGC TCGCAGCTGG TGCCGGTGCG CGCGCTCGGC CTGGGCCACC 
GCTCCGACGA GCTGGTGCGT TTCCGCTTCT GCAGCGGCTC CTGCCGCCGC GCGCGCTCTC 
CACACGACCT CAGCCTGGCC AGCCTACTGG GCGCCGGGGC CCTGCGACCG CCCCCGGGCT 
CCCGGCCCGT CAGCCAGCCC TGCTGCCGAC CCACGCGCTA CGAAGCGGTC TCCTTCATGG 
ACGTCAACAG CACCTGGAGA ACCGTGGACC GCCTCTCCGC CACCGCCTGC GGCTGCCTGG
GCTGAGGGCT CGCTCCAGGG CTTTGCAGAC TGGACCCTTA CCGGTGGCTC TTCCTGCCTG 
GGACCCTCCC GCAGAGTCCC ACTAGCCAGC GGCCTCAGCC AGGGACGAAG GCCTCAAAGC 
TGAGAGGCCC CTACCGGTGG GTGATGGATA TCATCCCCGA ACAGGTGAAG GGACAACTGA 
CTAGCAGCCC CAGAGCCCTC ACCCTGCGGA TCCCAGCCTA AAAGACACCA GAGACCTCAG 
CTATGGAGCC CTTCGGACCC ACTTCTCACA GACTCTGGCA CTGGCCAGGC CTCGAACCTG 
GGACCCCTCC TCTGATGAAC ACTACAGTGG CTGAGGCATC AGCCCCCGCC CAGGCCCTGT 
AGGGACAGCA TTTGAAGGAC ACATATTGCA GTTGCTTGGT TGAAAGTGCC TGTGCTGGAA 
CTGGCCTGTA CTCACTCATG GGAGCTGGCC CC 

Seq ID NO: 277 Protein sequence:
Protein Accession #: NP_003967.1

1 11 21 31 41 51

I I I I I I

MELGLGGLST LSHCPWPRRQ PALWPTLAAL ALLSSVAEAS LGSAPRSPAP REGPPPVLAS 
PAGHLPGGRT ARWCSGRARR PPPQPSRPAP PPPAPPSALP RGGRAARAGG PGSRARAAGA 
RGCRLRSQLV PVRALGLGHR SDELVRFRFC SGSCRRARSP HDLSLASLLG AGALRPPPGS 
RPVSQPCCRP TRYEAVSFMD VNSTWRTVDR LSATACGCLG 

Seq ID NO: 278 DNA sequence 

Nucleic Acid Accession #: NM_057160.1 

Coding sequence: 1-714 

1 11 21 31 41 51 

I I I I ! I 

ATGCCCGGCC TGATCTCAGC CCGAGGACAG CCCCTCCTTG AGGTCCTTCC TCCCCAAGCC 

CACCTGGGTG CCCTCTTTCT CCCTGAGGCT CCACTTGGTC TCTCCGCGCA GCCTGCCCTG 

TGGCCCACCC TGGCCGCTCT GGCTCTGCTG AGCAGCGTCG CAGAGGCCTC CCTGGGCTCC 

GCGCCCCGCA GCCCTGCCCC CCGCGAAGGC CCCCCGCCTG TCCTGGCGTC CCCCGCCGGC 

CACCTGCCGG GGGGACGCAC GGCCCGCTGG TGCAGTGGAA GAGCCCGGCG GCCGCCGCCG 

CAGCCTTCTC GGCCCGCGCC CCCGCCGCCT GCACCCCCAT CTGCTCTTCC CCGCGGGGGC 

CGCGCGGCGC GGGCTGGGGG CCCGGGCAGC CGCGCTCGGG CAGCGGGGGC GCGGGGCTGC 

CGCCTGCGCT CGCAGCTGGT GCCGGTGCGC GCGCTCGGCC TGGGCCACCG CTCCGACGAG 

CTGGTGCGTT TCCGCTTCTG CAGCGGCTCC TGCCGCCGCG CGCGCTCTCC ACACGACCTC 

AGCCTGGCCA GCCTACTGGG CGCCGGGGCC CTGCGACCGC CCCCGGGCTC CCGGCCCGTC 

AGCCAGCCCT GCTGCCGACC CACGCGCTAC GAAGCGGTCT CCTTCATGGA CGTCAACAGC 

ACCTGGAGAA CCGTGGACCG CCTCTCCGCC ACCGCCTGCG GCTGCCTGGG CTGAGGGCTC 

GCTCCAGGGC TTTGCAGACT GGACCCTTAC CGGTGGCTCT TCCTGCCTGG GACCCTCCCG 

CAGAGTCCCA CTAGCCAGCG GCCTCAGCCA GGGACGAAGG CCTCAAAGCT GAGAGGCCCC 

TACCGGTGGG TGATGGATAT CATCCCCGAA CAGGTGAAGG GACAACTGAC TAGCAGCCCC 

AGAGCCCTCA CCCTGCGGAT CCCAGCCTAA AAGACACCAG AGACCTCAGC TATGGAGCCC 

TTCGGACCCA CTTCTCACAG ACTCTGGCAC TGGCCAGGCC TCGAACCTGG GACCCCTCCT 

CTGATGAACA CTACAGTGGC TGAGGCATCA GCCCCCGCCC AGGCCCTGTA GGGACAGCAT

TTGAAGGACA CATATTGCAG TTGCTTGGTT GAAAGTGCCT GTGCTGGAAC TGGCCTGTAC 

TCACTCATGG GAGCTGGCCC C 

Seq ID NO: 279 Protein sequence: 
Protein Accession #: NP_476501.1 

1 11 21 31 41 51

I I I I I I

MPGLISARGQ PLLEVLPPQA HLGALFLPEA PLGLSAQPAL WPTLAALALL SSVAEASLGS 
APRSPAPREG PPPVLASPAG HLPGGRTARW CSGRARRPPP QPSRPAPPPP APPSALPRGG 
RAARAGGPGS RARAAGARGC RLRSQLVPVR ALGLGHRSDE LVRFRFCSGS CRRARSPHDL
SLASLLGAGA LRPPPGSRPV SQPCCRPTRY EAVSFMDVNS TWRTVDRLSA TACGCLG 

Seq ID NO: 280 DNA sequence 

Nucleic Acid Accession #: NM_057090.1 

Coding sequence: 29-715

1 11 21 31 41 51 

I I I I I I 

CTGATGGGCG CTCCTGGTGT TGATAGAGAT GGAACTTGGA CTTGGAGGCC TCTCCACGCT 
GTCCCACTGC CCCTGGCCTA GGCGGCAGGC TCCACTTGGT CTCTCCGCGC AGCCTGCCCT 
GTGGCCCACC CTGGCCGCTC TGGCTCTGCT GAGCAGCGTC GCAGAGGCCT CCCTGGGCTC 
CGCGCCCCGC AGCCCTGCCC CCCGCGAAGG CCCCCCGCCT GTCCTGGCGT CCCCCGCCGG 
CCACCTGCCG GGGGGACGCA CGGCCCGCTG GTGCAGTGGA AGAGCCCGGC GGCCGCCGCC 
GCAGCCTTCT CGGCCCGCGC CCCCGCCGCC TGCACCCCCA TCTGCTCTTC CCCGCGGGGG 
CCGCGCGGCG CGGGCTGGGG GCCCGGGCAG CCGCGCTCGG GCAGCGGGGG CGCGGGGCTG 
CCGCCTGCGC TCGCAGCTGG TGCCGGTGCG CGCGCTCGGC CTGGGCCACC GCTCCGACGA 
GCTGGTGCGT TTCCGCTTCT GCAGCGGCTC CTGCCGCCGC GCGCGCTCTC CACACGACCT 
CAGCCTGGCC AGCCTACTGG GCGCCGGGGC CCTGCGACCG CCCCCGGGCT CCCGGCCCGT 
CAGCCAGCCC TGCTGCCGAC CCACGCGCTA CGAAGCGGTC TCCTTCATGG ACGTCAACAG 



291 



WO 02/086443 

CACCTGGAGA ACCGTGGACC GCCTCTCCGC CACCGCCTGC GGCTGCCTGG GCTGAGGGCT
CGCTCCAGGG CTTTGCAGAC TGGACCCTTA CCGGTGGCTC TTCCTGCCTG GGACCCTCCC
GCAGAGTCCC ACTAGCCAGC GGCCTCAGCC AGGGACGAAG GCCTCAAAGC TGAGAGGCCC
CTACCGGTGG GTGATGGATA TCATCCCCGA ACAGGTGAAG GGACAACTGA CTAGCAGCCC
CAGAGCCCTC ACCCTGCGGA TCCCAGCCTA AAAGACACCA GAGACCTCAG CTATGGAGCC
CTTCGGACCC ACTTCTCACA GACTCTGGCA CTGGCCAGGC CTCGAACCTG GGACCCCTCC
TCTGATGAAC ACTACAGTGG CTGAGGCATC AGCCCCCGCC CAGGCCCTGT AGGGACAGCA
TTTGAAGGAC ACATATTGCA GTTGCTTGGT TGAAAGTGCC TGTGCTGGAA CTGGCCTGTA
CTCACTCATG GGAGCTGGCC CC



Seq ID NO: 281 Protein sequence: 
Protein Accession #: NP_476431.1 



1 11 21 31 41 51 

I I I I I I 

MELGLGGLST LSHCPWPRRQ APLGLSAQPA LWPTLAALAL LSSVAEASLG SAPRSPAPRE

GPPPVLASPA GHLPGGRTAR WCSGRARRPP PQPSRPAPPP PAPPSALPRG GRAARAGGPG

SRARAAGARG CRLRSQLVPV RALGLGHRSD ELVRFRFCSG SCRRARSPHD LSLASLLGAG

ALRPPPGSRP VSQPCCRPTR YEAVSFMDVN STWRTVDRLS ATACGCLG



Seq ID NO: 282 DNA sequence 

Nucleic Acid Accession #: Eos sequence



1 11 21 31 41 51 

I l i I I l 

CTACTGCACC TGCCCTCTGT TTCCTTTGGA AATCTCTTAC CTTTCATTAG GGTTTCTTTC 
ATAGCAATTT CCTTTGGTTT TTAAGACTTC TACATTGCTT TTTCTTTTAT TATCTGTGCT 
CCGTGAACCT TATGAATGCT GCTTAAAAAT AATGTCAAAA TATGTTTTAG CTGCCTACTC 
AGGTAACGTT TTCTTTTGCT CTCATCTTGG TTTCCATATA CTATTTTTGG TTTTTTGTGA 
GATCTAATCA ATGATCTAGT CAGAAGCTAC TTCACTGGCT AACAGTGATC ATGTTCATGT 
GCTAAAAATG AACTTGAAAC ACGGAAGTAG TGGTTGGTCC AGTTTGAAAG CTCTTATTAG
TATTCTTCAT CCTGGCTGTA ATAATAGCCA TTATTTGTTA TGCCTTTGTT ATGTAGCAGA
CACTCTTAAG GATTTTATGT GTATTATTCA AATTGCTATT ACTGTTCTTT TTATAGTTGA
GAATCTCAGG ATACCTACAT TTATCACTTT TTCAATATAT ATGTATTTCT TATT 



Seq ID NO: 283 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 564-1481 



1 11 21 31 41 51 

I I I I I I 

GAGACTTTTA ATCATCTATC CCTTGTGCTT TACGCAGACC CTACAATACA CTAGAGGCTT 

CAAAGAGGTC AAAAATTCAC ATGTGTAGAC AAATTAGGTC CCTTAAGATG CCAGGCAAAC 

GAAGTGCTAC CAAAACACGC AATGACTGTC CTAAAAGTGC GTTCTGGGAT ACACCTGTAA 

ACTTGGATCA AGTTCCCTCC CCTCTCCTCA AAATATATCG ACTTGTGCTG AAAGAAATCA 

CGACCGATGC TGACAATTCT GACCTCGTAA TTATATAGGG GGTGGTTTTG GTTTCTGCGT 

CTTTCCCTGA TTCAGTGGCA GGTAACATAT TTCATGTACA AAATGAACTG CAACACCACG 

GCAAACAAGG GACAGGCCCT CAAAGTTGTC GGTAGGGAGC CAGGACCCCG CCAGTGGCGT 

GGGGAGACAC CGTACTAAAC AAGCTTGCAA ACAGCAGGCA CCTTCCTGCC ACTGAGGAGG 

AAGGGCTGGC TAAGGGAGGC CGGGGCGGAG GAAGCCAAGC TCTGCAGGCC CTGACAAAGT 

CCTCCCGGCC TCCACGCGTC GCCATGGCAA CGCGGGGTCT GTGCTGGCCG GGATTGGCCG 

GCCTGGCGCG CGCAGGGCCC GCTGGGAAAG CGCGTCCCCG CCGCGGCTCC GCCAGTTTGA 

ACTTGGCGGG CCAGATGTGG GCGGCGGGGC GCTGGGGGCC TACTTTTCCC TCTTCCTACG 

CCGGTTTCTC TGCTGACTGC AGACCCAGGT CTCGGCCCTC CTCGGACTCC TGCTCAGTCC 

CTATGACGGG CGCACGTGGG CAGGGGCTGG AGGTGGTGCG CTCGCCGTCG CCGCCGCTGC 

CGCTGAGCTG CAGCAATTCC ACCAGGTCGC TGTTGTCTCC CCTTGGCCAC CAGAGCTTCC 

AGTTTGACGA GGACGACGGT GACGGGGAGG ATGAGGAAGA CGTGGATGAT GAGGAAGACG 

TGGATGAAGA TGCCCATGAT TCAGAGGCCA AAGTGGCGAG CCTGAGAGGA ATGGAGTTAC 

AGGGGTGCGC CAGCACTCAG GTTGAATCAG AAAATAACCA AGAAGAACAG AAACAGGTGC 

GCTTACCAGA AAGCCGCCTG ACACCATGGG AGGTGTGGTT TATTGGCAAA GAAAAAGAAG 

AACGTGACCG GCTGCAACTG AAAGCTCTAG AGGAATTAAA TCAACAACTA GAAAAAAGAA 

AAGAAATGGA AGAACGTGAA AAAAGAAAGA TAATTGCTGA AGAAAAGCAC AAGGAATGGG 

TTCAGAAAAA GAATGAGCAA AAAAGAAAAG AAAGAGAACA AAAAATTAAT AAAGAAATGG 

AGGAAAAAGC AGCAAAGGAA CTGGAGAAAG AATACTTGCA AGAAAAAGCA AAAGAAAAAT

ATCAAGAATG GTTAAAGAAA AAAAATGCTG AAGAATGTGA GAGGAAGAAG AAAGAAAAGA 

AAAACAACAG CAAGCTGAAA TACAGGAGAA AAAGGAAATA GCAGAAAAAA AGTTTCAAGA 

ATGGTTGGAA AATGCGAAAC ATAAACCTCG TCCAGCTGCA AAGAGCTATG GTTATGCCAA 

TGGAAAACTT ACAGGTTTTT ACAGTGGAAA TTCCTATCCA GAACCAGCCT TTTATAATCC 

AATTCCGTGG AAACCAATTC ATATGCCACC TCCCAAAGAA GCTAAGGATC TATCAGGAAG 

GAAGAGTAAA AGACCTGTGA TAAGTCAGCC ACACAAGTCA TCATCTCTGG TAATTCATAA 

AGCCAGGAGC AATCTTTGCC TTGGAACTCT GTGCAGAATA CAAAGATAGC GTATGTGGAA 

AATAACATGC TTTTATCTGG AGCTATTTAA TTTAAAAATC AGAAATTGTT TTTTACTGCT 

CAGTCAATAA CTCAACACTT AATGTGATTA TTGACAAATA GCAATTTTTG CATTTGTATA 

TGGAGTCCTT AGAGTTGAGG AAGATATTTT CTGGATTTTG GTTTTTATAA ACTTTTTAAG 

GTTGATCTTG GCATGTTGTT TTGCAGAATA AGTGGCTGAA TATGTAAGAA TTGTGTTTGT 

ATTTAGCTTG TATTAAAAGT ACACTGTAAT ACCAATAAAA CTAACAATTT TTCTTG



Seq ID NO: 284 Protein sequence: 
Protein Accession #: Eos sequence 



1 11 21 31 41 51 

I I I I I I

MATRGLCWPG LAGLARAGPA GKARPRRGSA SLNLAGQMWA AGRWGPTFPS SYAGFSADCR 

PRSRPSSDSC SVPMTGARGQ GLEVVRSPSP PLPLSCSNST RSLLSPLGHQ SFQFDEDDGD

GEDEEDVDDE EDVDEDAHDS EAKVASLRGM ELQGCASTQV ESENNQEEQK QVRLPESRLT 

PWEVWFIGKE KEERDRLQLK ALEELNQQLE KRKEMEEREK RKIIAEEKHK EWVQKKNEQK

RKEREQKINK EMEEKAAKEL EKEYLQEKAK EKYQEWLKKK NAEECERKKK EKKNNSKLKY 



292 



WO 02/086443 



PCT/US02/12476 



RRKRK 

Seq ID NO: 285 DNA sequence 
Nucleic Acid Accession #: Eos sequence 
5 Coding sequence: 1-1746 

1 11 21 31 41 51 

I l I l l I 

ATGCCACTGA AGCATT AT CT CCTTTTGCTG GTGGGCTGCC AAGCCTGGGG TGCAGGGTTG 60 

10 GCCTACCATG GCTGCCCTAG CGAGTGTACC TGCTCCAGGG CCTCCCAGGT GGAGTGCACC 12 0 

GGGGCACGCA TTGTGGCGGT GCCCACCCCT CTGCCCTGGA ACGCCATGAG CCTGCAGATC 18 0 

CTCAACACGC ACATCACTGA ACTCAATGAG TCCCCGTTCC TCAATATCTC AGCCCTCATC 24 0 

GCCCTGAGGA TTGAGAAGAA TGAGCTGTCG CGCATCACGC CTGGGGCCTT CCGAAACCTG 3 00 

GGCTCGCTGC GCTATCTCAG CCTCGCCAAC AACAAGCTGC AGGTTCTGCC CATCGGCCTC 3 60 

15 TTCCAGGGCC TGGACAGCCT TGAGTCTCTC CTTCTGTCCA GTAACCAGCT GTTGCAGATC 420 

CAGCCGGCCC ACTTCTCCCA GTGCAGCAAC CTCAAGGAGC TGCAGTTGCA CGGCAACCAC 480 

CTGGAATACA TCCCTGACGG AGCCTTCGAC CACCTGGTAG GACT CACGAA GCTCAATCTG 540 

GGCAAGAATA GCCTCACCCA CATCTCACCC AGGGTCTTCC AGCACCTGGG CAATCTCCAG 600 

GTCCTCCGGC TGTATGAGAA CAGGCTCACG GATATCCCCA TGGGCACTTT TGATGGGCTT 660 

20 GTTAACCTGC AGGAACTGGC TCTACAGCAG AACCAGATTG GACTGCTCTC CCCTGGTCTC 720 

TTCCACAACA ACCACAACCT CCAGAGACTC TACCTGTCCA ACAACCACAT CTCCCAGCTG 780 

CCACCCAGCA TCTTCATGCA GCTGCCCCAG CTCAACCGTC TTACTCTCTT TGGGAATTCC 840 

CTGAAGGAGC TCTCTCTGGG GATCTTCGGG CCCATGCCCA ACCTGCGGGA GCTTTGGCTC 900 

TATGACAACC ACATCTCTTC TCTACCCGAC AATGTCTTCA GCAACCTCCG CCAGTTG CAG 960 

25 GTCCTGATTC TTAGCCGCAA TCAGAT CAGC TTCATCTCCC CGGGTGCCTT CAACGGG CTA 102 0 

ACGGAGCTTC GGGAGCTGTC CCTCCACACC AACGCACTGC AGGACCTGGA CGGGAATGTC 1080 

TTCCGCATGT TGGCCAACCT GCAGAACATC TCCCTGCAGA ACAATCGCCT CAGACAGCTC 1140 

CCAGGGAATA TCTTCGCCAA CGTCAATGGC CTCATGGCCA TCCAGCTGCA GAACAACCAG 12 00 

CTGGAGAACT TGCCCCTCGG CATCTTCGAT CACCTGGGGA AACTGTGTGA GCTGCGGCTG 12 60 

30 TATGACAATC CCTGGAGGTG TG ACT CAG AC ATCCTTCCGC TCCGCAACTG GCTCCTGCTC 132 0 

AACCAGCCTA GGTTAGGGAC GGACACTGTA CCTGTGTGTT TCAGCCCAGC CAATGTCCGA 13 80 

GGCCAGTCCC TCATTATCAT CAATGTCAAC GTTGCTGTTC CAAGCGTCCA TGTCCCTGAG 1440 

GTGCCTAGTT ACCCAGAAAC ACCATGGTAC CCAGACACAC CCAGTTACCC TGACACCACA 150 0 

TCCGTCTCTT CTACCACTGA GCTAACCAGC CCTGTGGAAG ACTACACTGA TCTGACTACC 1560 

35 ATTCAGGTCA CTGATGACCG CAGCGTTTGG GGCATGACCC AGGCCCAGAG CGGGCTGGCC 162 0 

ATTGCCGCCA TTGTAATTGG CATTGTCGCC CTGGCCTGCT CCCTGGCTGC CTGCGTCGGC 168 0 

TGTTGCTGCT GCAAGAAGAG GAGCCAAGCT GTCCTGATGC AGATGAAGGC ACCCAATGAG 1740 

TGTTAAAGAG GCAGGCTGGA GCAGGGCTGG GGAATGATGG GACTGGAGGA CCTGGGAATT 18 0 0 

TCATCTTTCT GCCTCCACCC CTGGGTCCAT GGAGCTTTCC CGTGATTGCT CTTTCTGGCC 18 6 0 

40 CTAGATAAAG GTGTGCCTAC CTCTTCCTGA CTTGCCTGAT TCTCCCGTAG AGAAGCAGGT 192 0 

CGTGCCGGAC CTTCCTACAA TCAGGAAGAT AGATCCAACT GGCCATGGCA AAAGCCCTGG 198 0 

GGATTTCCGA TTCATACCCC TGGGCTTCCT TCGAGAGGGC TCTTCCTCCA AATCCTCCCC 2 04 0 

ACCTGTCCTC CAAGAACAGC CTTCCCTGCG CCCAGGCCCC CTCCGGGCCT CTGTAGACTC 210 0 

AGTTAGTCCA CAGCCTGCTC ACTTCGTGGG AATAGTT CT C CGCTGAGATA GCCCCTCTCG 2160 

45 CCTAAGTATT ATGTAAGTTG ATTTCCCTTC TTTTGTTTCT CTTGTTTGTG CTATGGCTTG 222 0 

ACCCAGCATG TCCCCTCAAA TGAAAGTTCT CCCCTTGATT TTCTGCTCCT GAAGGCAGGG 22 80 

TGAGTTCTCT CCTCAAAGAA GACTTCAAAC CATTTAACTG GTTTCTTAAG AGCCGTCAAT 2340 

CAGCCTGGTT TTGGGGATGC TATGAAAGAG AGAAGGAAAA TCATGCCGCT CAGTTCCTGG 240 0 

AGACAGAAGA GCCGTCATCA GTGT CTCACT TGTGATTTTT ATCTGGAAAA GGAAGAAACA 2460 

50 CCCCAGCACA GCAAGCTCAG CCTTTTAGAG AAGGATATTT CCAAACTGCA AACTTTGCTT 2520 

TGAAAAGTTT AGCCCTTTAA GGAATGAAAT CATGTAGAAT TTTGGACTTC TAAAAACATT 25 80 

AAAATCAGCT TATTAATACG GGATAGAGAA AGAAATCTGG TGCCTGGGGG TCCCTGTGTT 2 640 

CACCCCTAGA GTTTGTTTTA AAATTTTTAA TTGAAGCATG TGAAGTGTAC STGCAGAAAA 2700 

GTGGGAACAT GATAGTGTAT GGCTTGGTGG ATTTTCACAA ACTGAACATA CCTGTGTAAT 27 60 

55 CAGCATCTAG ACCCAGACCC AGAGCATCAC AAATATCCCC CATCCTGGGC TTTTCCCAGA 2 820 

GGAGATGGGG GCTTCTGAAG ATGGACTTAC CTGGGACCTG CCCCCCATGA GCCAGGACGG 2 880 

TCCCCCCACA GTCAGCCTGT GCAAAGGCCC CGTGGCCAGG GGTGGAGGAG AATATGTGGG 2 940 

TGTGGACAGG ATGGGAGACT GTGGCCTGAA CAGGAGATTT TATTATATCT GGAGACCCTG 3 000 

AGAGACCCTG AGACCTGGGG CACCATGGCT GGCCAGGTCA GAAGCATCCT GACTGCAGAG 3 060 

60 GT C CG TG CAG CCACACCCTC TTCCCTGCCA GCAAGTTGTC TGCGGCTCAT CGGAGGCCCC 312 0 

TCCGCCTGGA GCCTTCTATG GACGTGATAT GCCTGTATCT GTTTTTAATT TTCATTCTTC 3180 

ACTTAGGGGA AGTGAAATCG CTCAGAGATG AGATCCTTTA ATTGAAAACG AAGTGTAACG 3240 

GAATCTAGTG TCTTTCTAAT GTGGTAAAAT TCTCCATCAA CATCACAGTC AGCTGGCAGC 33 0 0 

TGAACTT CAG AATCTCACTT ACAGCAGGCG ACACGGGGGT ACACCGATGG GTCACACTGG 3 3 60 

65 GTCTGGGGGC TCCCTGGAGC TCCTCCTGCG TGTGGTCTGG TTAGGAGTTG AGTTGTTTGC 3 420 

T CCAGGGTT A TTCTGCTCCT CGAGTCACAG TCACACGAAT ACCTGCCTTC TCTGGCTTTC 3 480 

CTGCTATACA CATATTCACA TGGCGCTCAA GAAGTTAGGC TCATGGCAAC GTGTGTCTTT 3 540 

CT CTGGACAA CTGGCCCAGT TTACAGTGAA ATGGAGAATT TCAGGTCTCC ACGTCTGCCC 3 600 

AGGAAAGAAC TTCAGCTGAC TCCACGGGGA TCTGGAAATC CACGACCAAT CCCGATCGGC 3 660 

70 TCTTATTAGC TCCCCGCTCC ACAAGACACC TGTGCTTTGG AAATCCACCA CCAATCCCGA 3720 

TCGGCTCTTA TTAGCTCCCC GCTCCACAAG ACACCTGTGA TCTGGAAATC TACCACCAAT 3 780 

CCCGATCGGC TCTTATTAGC TCCCCGCTCC ACAAGACACC TGTGACATCC TCCAGGGCCA 3 840 

CAG GAGCACG TGCTGACCAG TTTTCCCTTC CAGTTCCTGC ACAAAAAGTG TCCAGAGGGC 3 900 

TGTTTGCAAA CACTAGTG CA CTTTGTAGCT TTTCACCCTC TGTCCCAGGG AAT CTAGGAG 3 960 

75 AGATGAGGCC CGTCAGAGTC AAGAGATGTC ATCCCCCCAG GGTCTCCAAG GCATTTCCAC 4020 

ACTATTGGTG GCACCTGGAG GACATGCACC AAGGCTTGCC AGAGCCAACA GGAAGTGAGC 4080 

CCAGAGCATG GCACATGAGC ATCACCCGCT GATGGTGGCC TGCTGTGCCT GGTGCCAACA 4140 

GGGGCATCCC GGCCCGTACC CCTCCAGACA GGAAGCATGG GTTTGCCCAC AG ACCT GT CG 4200 

GGTGCTCCTG TGAGTGGCCT CCAGATGTCT TTGTGCATAG GCACAAGTGG GCCAGGGCTG 42 60 

80 GAGGGAGGTG GGAAACCT CA T CAT CCGGTG GGCCCTGCCA ATCTTAACCC AGAACCCTTA 4320 

GGTATTCCTG GCAGTAGCCA TGACATTGGA GCACCTTCCT CTCCAGCCAG AGGCTGACCT 4380 

GAGGGCCACT GTCCTCAGAT GACACCACCC AGGAGCACCC TAGGTGAGGG GTGAGGGCCC 4440 

CCTTATGTGA ACCTCTTGCC TCTTCCTTTC TCCCATCAGA GTGGTTGGAT GGAGCCATTG 4500 

GCCTCCTTTT CTTCAGCGGG CCCTTCAACC TCTCTGCACC ATGTTGTCTG GCTGAGGAGC 4560 

85 TACTAGAAAA GCTGAGTGGA GTCTCCTTTC CAACAGGATG ATGCATTTGC TCAATTCTCA 462 0 

GGGCTGGAAT GAGCCGGCTG GTCCCCCAGA AAGCTGGAGT GGGGTACAGA GTTCAGTTTT 4680 

CCT CTCTGTT TACAGCTCCT TGACAGTCCC ACGCCCATCT GGAGTGGGAG CTGGGAGTTA 4740 
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GTGTTGGAGA AGAAACAACA AAAGCCAATT AGAACCACTA TTTTTAAAAA GTGCTTACTG 4 800 

TGCACAGATA CTCTTCAAGC ACTGGACGTG GATTCTCTCT CTAGCCCTCA GCACCCCTGC 4860 

GGTAGGAGTG CCGCCTCTAC CCACTTGTGA TGGGGTACAG AGGCACTTGC TCTTCTGCAT 4 920 

GGTGTTCAAT AGGCTGGGAG TTTTATTTAT CTCTTCAAAC TTTGTACAAG AG CTCATGGC 4 980 

5 TTGTCTTGGG CTTTCGTCAT TAAACCAAAG GAAATGGAAG CCATTCCCCT GTTGCTCTCC 5040 

TTAGTCTTGG TCATCAGAAC CTCACTTGGT ACCATATAGA TCAAAAGCTT TGTAACCACA 5100 

GGAAAAAATA AACTCTTCCA TCCCTTAAAG AATAGAATAG TTTGTCCCTC TCATGGGAAT 5160 

TGGGCTGTAT GTATATTGTT CTTCCTCCTT AGAATTTAGA GATACAAGAG TTCTACTTAG 5220 

AACTTTTCAT GGACACAATT TCCACAACCT TTCAGATGCT GATGTAGAGC TATTGGGAAA 5280 

10 GAACTTCCAA ACTCAGGAAG TTTGCAGAGA GCAGACAGCT AGAGATAACT CGGGACCCAG 5340 

AGTTGGTCGA CAGATGTTAG ATGTATCCTA GCTTTTAGCC ATAAACCACT CAAAGATTCA 5400 

GCCCCCAGAT CCCACAGTCA GAACTGAATC TGCGTTGTTG GGAAGCCAGC AGTGGCCTTG 5460 

GGAAGGAAGC CATGGCTGTG GTTCAGAGAG GGTGGGCTGG CAAGCCACTT CCGGGGAAAA 5520 

CTCCTTCCGC CCCAGGTTTC TTCTTCTCTT AAGGAGAGAT TGTTCTCACC AACCCGCTGC 5580 

15 CTTCATGCTG CCTTCAAAGC TAG AT CATGT TTGCCTTGCT TAGAGAATTA CTGCAAATCA 5640 

GCCCCAGTGC TTGGCGATGC ATTTACAGAT TTCTAGGCCC TCAGGGTTTT GTAGAGTGTG 5700 

AGCCCTGGTG GGCAGGGTTG GGGGGTCTGT CTTCTGCTGG ATGCTGCTTG TAAT CCATTT 5760 

GGTGTACAGA ATCAACAATA AATAATATAC ATGTAT 

20 Seq ID NO: 286 Protein sequence: 
Protein Accession #: NP_570843.1 

1 11 21 31 41 51 

I I I I I I

25 MPLKHYLLLL VGCQAWGAGL AYHGCPSECT CSRASQVECT GARIVAVPTP LPWNAMSLQI 60

LNTHITELNE SPFLNISALI ALRIEKNELS RITPGAFRNL GSLRYLSLAN NKLQVLPIGL 120

FQGLDSLESL LLSSNQLLQI QPAHFSQCSN LKELQLHGNH LEYIPDGAFD HLVGLTKLNL 180

GKNSLTHISP RVFQHLGNLQ VLRLYENRLT DIPMGTFDGL VNLQELALQQ NQIGLLSPGL 240

FHNNHNLQRL YLSNNHISQL PPSIFMQLPQ LNRLTLFGNS LKELSLGIFG PMPNLRELWL 300 

30 YDNHISSLPD NVFSNLRQLQ VLILSRNQIS FISPGAFNGL TELRELSLHT NALQDLDGNV 360

FRMLANLQNI SLQNNRLRQL PGNIFANVNG LMAIQLQNNQ LENLPLGIFD HLGKLCELRL 420

YDNPWRCDSD ILPLRNWLLL NQPRLGTDTV PVCFSPANVR GQSLIIINVN VAVPSVHVPE 480 

VPSYPETPWY PDTPSYPDTT SVSSTTELTS PVEDYTDLTT IQVTDDRSVW GMTQAQSGLA 540 
IAAIVIGIVA LACSLAACVG CCCCKKRSQA VLMQMKAPNE C 



35 



Seq ID NO: 287 DNA sequence 
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Coding sequence: 1..954 
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ATGTCTTCTG AGCAGAAGAG TCAGCACTGC AAGCCTGAGG AAGGCGTTGA GGCCCAAGAA 60 

GAGGCCCTGG GCCTGGTGGG TGCACAGGCT CCTACTACTG AGGAGCAGGA GGCTGCTGTC 12 0 

TCCTCCTCCT CTCCTCTGGT CCCTGGCACC CTGGAGGAAG TGCCTGCTGC TGAGTCAGCA 180 

45 GGTCCTCCCC AGAGTCCTCA GGGAGCCTCT GCCTTACCCA CTACCATCAG CTTCACTTGC 240 

TGGAGGCAAC CCAATGAGGG TTCCAGCAGC CAAGAAGAGG AGGGGCCAAG CACCTCGCCT 300 

GACGCAGAGT CCTTGTTCCG AGAAGCACTC AGTAACAAGG TGGATGAGTT GGCTCATTTT 360 

CTGCTCCGCA AGTATCGAGC CAAGGAGCTG GTCACAAAGG CAGAAATGCT GGAGAGAGTC 420 

ATCAAAAATT ACAAGCGCTG CTTTCCTGTG ATCTTCGGCA AAGCCTCCGA GTCCCTGAAG 480 

50 ATGATGTTTG GCATTGACGT GAAGGAAGTG GACCCCGCCA GCAACACCTA CACCCTTGTC 540 

ACCTGCCTGG GCCTTTCCTA TGATGGCCTG CTGGGTAATA ATCAGATCTT TCCCAAGACA 600 

GGCCTTCTGA TAATCGTCCT GGGCACAATT GCAATGGAGG GCGACAGCGC CTCTGAGGAG 660 

GAAATCTGGG AGGAGCTGGG TGTGATGGGG GTGTATGATG GGAGGGAGCA CACTGTCTAT 720 

GGGGAGCCCA GGAAACTGCT CACCCAAGAT TGGGTGCAGG AAAACTACCT GGAGTACCGG 780 

55 CAGGTACCCG GCAGTAATCC TGCGCGCTAT GAGTTCCTGT GGGGTCCAAG GGCTCTGGCT 840 

GAAACCAGCT ATGTGAAAGT CCTGGAGCAT GTGGTCAGGG TCAATGCAAG AGTTCGCATT 900 
GCCTACCCAT CCCTGCGTGA AGCAGCTTTG TTAGAGGAGG AAGAGGGAGT CTGA 

60 Seq ID NO: 288 Protein sequence:
Protein Accession #: NP_002353.1

1 11 21 31 41 51 ' 

„ I I l ] I I 

02> MSSEQKSQHC KPEEGVEAQE EALGLVGAQA PTTEEQEAAV SSSSPLVPGT LEEVPAAESA 60 

GPPQSPQGAS ALPTTISFTC WRQPNEGSSS QEEEGPSTSP DAESLFREAL SNKVDELAHF 120 

LLRKYRAKEL VTKAEMLERV IKNYKRCFPV IFGKASESLK MIFGIDVKEV DPASNTYTLV 180

TCLGLSYDGL LGNNQIFPKT GLLIIVLGTI AMEGDSASEE EIWEELGVMG VYDGREHTVY 240 

GEPRKLLTQD WVQENYLEYR QVPGSNPARY EFLWGPRALA ETSYVKVLEH VVRVNARVRI 300

70 AYPSLREAAL LEEEEGV 

Seq ID NO: 289 DNA sequence 
Nucleic Acid Accession #: NM_002362
Coding sequence: 46..1344

1 . 11 21 31 41 51 
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CGGCGGCCGC GCCCTGGTTG GGTCCCCACT GCTCTCGGGG GCGCCATGGA CGAGGCCGTG 60 

80 GGCGACCTGA AGCAGGCGCT TCCCTGTGTG GCCGAGTCGC CAACGGTCCA CGTGGAGGTG 120 

CATCAGCGCG G C AG C AG C AC TGCAAAGAAA GAAGACATAA ACCTGAGTGT TAGAAAGCTA 180 

CTCAACAGAC ATAATATTGT GTTTGGTGAT TACACATGGA CTGAGTTTGA TGAACCTTTT 240 

TTGACCAGAA ATGTGCAGTC TGTGTCTATT ATTGACACAG AATTAAAGGT TAAAGACTCA 3 00 

CAGCCCATCG ATTTGAGTGC ATGCACTGTT GCACTTCACA TTTTCCAGCT GAATGAAGAT 3 60 

85 GGCCCCAGCA GTGAAAATCT GGAGGAAGAG ACAGAAAACA TAATTGCAGC AAATCACTGG 420 

GTTCTACCTG CAGCTGAATT CCATGGGCTT TGGGACAGCT TGGTATACGA TGTGGAAGTC 480 

AAATCCCAT C TCCTCGATTA TGTGATGACA ACTTTACTGT TTT CAGACAA GAACGTCAAC 540 



294 



WO 02/086443 

AGCAACCTCA TCACCTGGAA CCGGGTGGTG CTGCTCCACG GTCCTCCTGG CACTGGAAAA 600
ACATCCCTGT GTAAAGCGTT AGCCCAGAAA TTGACAATTA GACTTTCAAG CAGGTACCGA 660
TATGGCCAAT TAATTGAAAT AAACAGCCAC AGCCTCTTTT CTAAGTGGTT TTCGGAAAGT 720
GGCAAGCTGG TAACCAAGAT GTTTCAGAAG ATTCAGGATT TGATTGATGA TAAAGACGCC 780
CTGGTGTTCG TGCTGATTGA TGAGGTGGAG AGTCTCACAG CCGCCCGAAA TGCCTGCAGG 840
GCGGGCACCG AGCCATCAGA TGCCATCCGC GTGGTCAATG CTGTCTTGAC CCAAATTGAT 900
CAGATTAAAA GGCATTCCAA TGTTGTGATT CTGACCACTT CTAACATCAC CGAGAAGATC 960
GACGTGGCCT TCGTGGACAG GGCTGACATC AAGCAGTACA TTGGGCCACC CTCTGCAGCA 1020
GCCATCTTCA AAATCTACCT CTCTTGTTTG GAAGAACTGA TGAAGTGTCA GATCATATAC 1080
CCTCGCCAGC AGCTGCTGAC CCTCCGAGAG CTAGAGATGA TTGGCTTCAT TGAAAACAAC 1140
GTGTCAAAAT TGAGCCTTCT TTTGAATGAC ATTTCAAGGA AGAGCGAGGG CCTCAGCGGC 1200
CGGGTCCTGA GAAAACTCCC CTTTCTGGCT CATGCGCTGT ATGTCCAGGC CCCCACCGTC 1260
ACCATAGAGG GGTTCCTCCA GGCCCTGTCT CTGGCAGTGG ACAAGCAGTT TGAAGAGAGA 1320
AAGAAGCTTG CAGCTTACAT CTGATCCTGG GCTTCCCCAT CTGGTGCTTT TCCCATGGAG 1380
AACACACAAC CAGTAAGTGA GGTTGCCCCA CACAGCCGTC TCCCAGGGAA TCCCTTCTGC 1440
AAACCAAACG TTACTTAGAC TGCAAGCTAG AAAGCCACCA AGGCCAGGCT TTGTTAAAAG 1500
AAGTGTATTC TATTTATGTT GTTTTAAAAT GCATACTGAG AGACAAACAT CTTGTCATTT 1560
TCACTGTTTG TAAAAGATAA TTCAGATTGT TTGTCTCCTT GTGAAGAACC ATCGAAACCT 1620
GTTTGTTCCC AGCCCACCCC CAGTGGATGG GATGCATAAT GCCAGCAAGT TTTGTTTAAC 1680
AGCAAAAAAG GAAGATTAAT GCAGGTGTTA TAGAAGCCAG AAGAGAAACT GTGTCACCCT 1740
AAAGAAGCAT ATAATCATAG CATTAAAAAT GCACACATTA CTCCAGGTGG AAGGTGGCAA 1800
TTGCTTTCTG ATATCAGCTC GTTTGATTTA GTGCAAAAAT GTTTTCAAGA CTATTTAATG 1860
GATGTAAAAA AGCCTATTTC TAGATTATAC CAACTGAGAA AAAAATGGTC GGTAAAGTGT 1920
TCTTTCATAA TAAATAATCA AGACATGGTC CCATTTGCAG GAAAAGTGCA GACTCTGAGT 1980
GTTCCAGGGA AACACATGCT GGACATCCCT TGTAACCCGG TATGGGCGCC CCTGCATTGC 2040
TGGGATGTTT CTGCCCACGG TTTTGTTTGT GCAATAACGT TATCACATTT CTAATGAGGA 2100
TTCACATTAA TATAATATAA AATAAATAGG TCAGTTACTG GTCTCTTTCT GCCGAATGTT 2160
ATGTTTTGCT TTTATCTCAC AGTAAAATAA ATATAATTAA AAA



Seq ID NO: 290 Protein sequence:
Protein Accession #: NP_004228



1 11 21 31 41 51

I I I I I I

MDEAVGDLKQ ALPCVAESPT VHVEVHQRGS STAKKEDINL SVRKLLNRHN IVFGDYTWTE 60
FDEPFLTRNV QSVSIIDTEL KVKDSQPIDL SACTVALHIF QLNEDGPSSE NLEEETENII 120
AANHWVLPAA EFHGLWDSLV YDVEVKSHLL DYVMTTLLFS DKNVNSNLIT WNRVVLLHGP 180
PGTGKTSLCK ALAQKLTIRL SSRYRYGQLI EINSHSLFSK WFSESGKLVT KMFQKIQDLI 240
DDKDALVFVL IDEVESLTAA RNACRAGTEP SDAIRVVNAV LTQIDQIKRH SNVVILTTSN 300
ITEKIDVAFV DRADIKQYIG PPSAAAIFKI YLSCLEELMK CQIIYPRQQL LTLRELEMIG 360
FIENNVSKLS LLLNDISRKS EGLSGRVLRK LPFLAHALYV QAPTVTIEGF LQALSLAVDK 420
QFEERKKLAA YI



Seq ID NO: 291 DNA sequence 

Nucleic Acid Accession #: NM_002658.1 

Coding sequence: 77-1372 

1 11 21 31 41 51 
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GTCCCCGCAG CGCCGTCGCG CCCTCCTGCC GCAGGCCACC GAGGCCGCCG CCGTCTAGCG 60 

CCCCGACCTC GCCACCATGA GAGCCCTGCT GGCGCGCCTG CTTCTCTGCG TCCTGGTCGT 12 0 

GAG CGACTCC AAAGGCAGCA ATGAACTTCA TCAAGTTCCA TCGAACTGTG ACTGTCTAAA 180 

TGGAGGAACA TGTGTGTCCA ACAAGTACTT CTCCAACATT CACTGGTGCA ACTGCCCAAA 24 0 

GAAATTCGGA GGG CAGC ACT GTGAAATAGA TAAGTCAAAA ACCTGCTATG AGGGGAATGG 3 00 

TCACTTTTAC CGAGGAAAGG CCAGCACTGA CACCATGGGC CGGCCCTGCC TGCCCTGGAA 3 60 

CTCTGCCACT GTCCTTCAGC AAACGTACCA TGCCCACAGA TCTGATGCTC TTCAGCTGGG 42 0 

CCTGGGGAAA CATAATTACT GCAGGAACCC AGACAACCGG AGGCGACCCT GGTGCTATGT 480 

GCAGGTGGGC CTAAAGCCGC TTGTCCAAGA GTGCATGGTG CATGACTGCG CAGATGGAAA 540 

AAAGCCCTCC TCTCCTCCAG AAGAATTAAA ATTTCAGTGT GGCCAAAAGA CTCTGAGGCC 600 

CCGCTTTAAG ATTATTGGGG GAGAATTCAC CACCATCGAG AACCAGCCCT GGTTTGCGGC 660 

CATCTACAGG AGGCACCGGG GGGGCTCTGT CACCTACGTG TGTGGAGGCA GCCTCATCAG 72 0 

CCCTTGCTGG GTGATCAGCG CCACACACTG CTTCATTGAT TACCCAAAGA AGGAGGACTA 780 

CATCGTCTAC CTGGGTCGCT CAAGGCTTAA CTCCAACACG CAAGGGGAGA TGAAGTTTGA 840 

GGTGGAAAAC CTCATCCTAC ACAAGGACTA CAGCGCTGAC ACGCTTGCTC ACCACAACGA 900 

CATTGCCTTG CTGAAGATCC GTTCCAAGGA GGGCAGGTGT GCGCAGCCAT CCCGGACTAT 960 

ACAGACCATC TGCCTGCCCT CGATGTATAA CGATCCCCAG TTTGGCACAA GCTGTGAGAT 102 0 

CACTGGCTTT GGAAAAGAGA ATTCTACCGA CTAT CTCT AT CCGGAGCAGC TGAAAATGAC 10 80 

TGTTGTGAAG CTGATTTCCC ACCGGGAGTG TCAGCAGCCC CACTACTACG GCTCTGAAGT 1140 

CACCACCAAA ATGCTATGTG CTGCTGACCC CCAATGGAAA ACAGATTCCT GCCAGGGAGA 1200 

CTCAGGGGGA CCCCTCGTCT GTTCCCTCCA AGGCCGCATG ACTTTGACTG GAATTGTGAG 12 60 

CTGGGGCCGT GGATGTGCCC TGAAGGACAA GCCAGGCGTC TACACGAGAG TCTCACACTT 132 0 

CTTACCCTGG ATCCGCAGTC ACACCAAGGA AGAGAATGGC CTGGCCCTCT GAGGGTCCCC 13 80 

AGGGAGGAAA CGGGCACCAC CCGCTTTCTT GCTGGTTGTC ATTTTTGCAG TAGAGTCATC 1440 

TCCATCAGCT GTAAGAAGAG ACTGGGAAGA TAGGCTCTGC ACAG AT G GAT TTGCCTGTGG 1500 

CACCACCAGG GTGAACGACA ATAGCTTTAC CCTCACGGAT AGGCCTGGGT GCTGGCTGCC 1560 

CAGACCCTCT GGCCAGGATG GAGGGGTGGT CCTGACTCAA CATGTTACTG ACCAGCAACT 1620 

TGTCTTTTTC TGGACTGAAG CCTG CAGGAG TTAAAAAGGG CAGGG CAT CT CCTGTGCATG 1680 

GGCT CGAAGG GAGAGCCAGC TCCCCCGACC GGTGGGCATT TGTGAGGCCC ATGGTTGAGA 1740 

AATGAATAAT TTCCCAATTA GGAAGTGTAA GCAGCTGAGG TCTCTTGAGG GAGCTTAGCC 1800 

AATGTGGGAG CAGCGGTTTG GGG AG C AG AG ACACTAACGA CTTCAGGGCA GGGCTCTGAT 18 60 

ATTCCATGAA TGTATCAGGA AATATATATG TGTGTGTATG TTTGCACACT TGTTGTGTGG 1920 

GCTGTGAGTG TAAGTGTGAG TAAGAGCTGG TGTCTGATTG TTAAGTCTAA ATATTTCCTT 1980 

AAACTGTGTG GACTGTGATG CCACACAGAG TGGTCTTTCT GGAGAGGTTA TAGGT CACTC 2040 

CTGGGGCCTC TTGGGTCCCC CACGTGACAG TGCCTGGGAA TGTACTTATT CTGCAGCATG 2100 

ACCTGTGACC AGCACTGTCT CAGTTTCACT TTCACATAGA TGTCCCTTTC TTGGCCAGTT 2160 

ATCCCTTCCT TTTAGCCTAG TTCATCCAAT CCTCACTGGG TGGGGTGAGG ACCACTCCTT 222 0 

ACACTGAATA TTTATATTTC ACTATTTTTA TTTATATTTT TGTAATTTTA AATAAAAGTG 2280 



295 



WO 02/086443 

ATCAATAAAA TGTGATTTTT CTGA 



PCT/US02/12476



Seq ID NO: 292 Protein sequence: 
Protein Accession #: NP_002649.1
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60 



MRAIiLARIiLI) 
HCEIDKSKTC 
YCRNPDNRRR 
GGEFTTIENQ 
RSRLNSNTQG 
PSMYNDPQFG 
CAADPQWKTD 
SHTKEENGLA 



11 

I 

CVLWSDSKG 
YEGNGHFYRG 
PWCYVOVGLK 
PWFAAIYRRH 
EMKFEVENLI 
TSCE I TGFGK 
SCQGDSGGPL 
L 



21 
I 

SNELHQVPSN 
KASTDTMGRP 
PLVQECMVHD 
RGGSVTYVCG 
LHKDYSADTL 
ENSTDYLYPE 
VCSLQGRMTL 



31 

1 

CD CLNGGTCV 
CLPWNSATVL 
CADGKKPSSP 
GSLISPCWVI 
AHHND I ALLK 
QLKMTWKIil 
TGIVSWGRGC 



41 

i 

SNKYFSNIHW 
QQTYHAHRSD 
PEELKFQCGQ 
SATHCFIDYP 
IRSKEGRCAQ 
SHRECQQPHY 
ALKDKPGVYT 



51 
i 

CNCPKKFGGQ 60 

ALQLGLGKHN 12 0 

KTLRPRFKI I 180 

KKEDYIVYLG 240 

PSRTIQTICL 300 

YGSEVTTKML 3 60 

RVSHFLPWIR 420 



Seq ID NO: 293 DNA sequence
Nucleic Acid Accession #: NM_001498 
Coding sequence: 93..2006



11 



65 



GGCACGAGGC 
AGGAGGAGGA 
TGAGCTGGGA 
TCCTGCACAT 
AGGTGGAATA 
CTGGGGAGAA 
CTACCCTTTG 
ACGGAGGAAC 
AGGCTACTTC 
TAGGCTGTCC 
CCAAGTCCCT 
CAAGAAATAT 
ACAAGAATAC 
CTTCTAAGCC 
TCCAGGTGAC 
CTACTATCTG 
TGT CAGACAT 
AGGAGCGAGG 
ACTCAATAGA 
TAGATAAAGA 
ATGTTGCTCA 
ATGATGCTAA 
GATTTAAGCC 
AGGTGCAATT 
GAGTGAT CCT 
TGAAGGTAGC 
TTTGCAAAGG 
TCGCTGCAGA 
TGTTTCCTGG 
ACACCAGATG 
TAATGACAGT 
ACAGTGTCAT 
ATGAATTATG 
GAAGTAAAAC 
ACTGGCTACA 
CTGTACTGTT 
TCTAGAGTTT 
AATAACATAT 
CAACCTACTG 
GAGTTAAAAT 
TGAAATTTTT 
TGTCTACATT 
GCACCTTATC 
GCTTTCCCCT 



TGAGTGTCCG 

GGAGGAGGAG 

GGAAACCAAG 

CTACCACGCC 

CATGTTGGTA 

AGTTCTTGAA 

GAGACCAGAG 

AATGTCCGAG 

TAT AT T AG AA 

TGGGTTCACA 

CTTCTTTCCA 

CCGACATAGG 

ACCATCTCCA 

GGATCATATT 

ATTCCAAGCC 

TCCAATTGTT 

TGATTGTCGC 

ACTGGAGCCA 

CAGCTATTTA 

GATCTACGAA 

TCTCTTTATT 

TGAGTCTGAC 

CCCTCCTCCA 

AACAGACTTT 

TTCCTACAAA 

ACAGAAAAGA 

TGGCAATGCA 

GGAGTACACC 

ACTGATCCCA 

TAGTATTCTG 

TGCCAGATGG 

AACTGATGAA 

TGAATGCCCA 

TGACTCATCC 

GTACCATGCC 

TTCTGGGCCA 

ATACAGTGTA 

CTAAAGTCAT 

TCTAAGCAGT 

GTTTACTGTA 

CTCTTTAAAA 

AAATCACTTG 

TATGATGTTT 

CTGAATAAAT 



21 

I 

TCTCGCGCCC 
GAGGGGG CGG 
CGCCATGCCG 
GTCAAGGACC 
TCTTTTGATC 
ACTCTGCAAG 
TATGGGAGTT 
TTCAATACAG 
GAAAATCAGG 
CTGCCCGAGG 
GATGAAGCAA 
AGAGGAGAAA 
TTTATAGAAA 
TACATGGATG 
TGCAGTATAT 
ATGGCTTTGA 
TGGGGAGTGA 
TTGAAGAACA 
TCTAAGTGTG 
CAGCTGTTGC 
AGAGACCCAC 
CATTTTGAGA 
AACTCAGACA 
GAGAACTCTG 
TTGGATTTTC 
GATGCTGTCT 
GTGGTGGATG 
CTCATGAGCA 
ATTCTGAACT 
AACTACCTAA 
ATGAGGGAGT 
ATGAATTATA 
GAGTTACTTG 
AACTAGACAT 
TCTCAGCCCG 
GTGAGCCAGA 
CATGTACATA 
CATGAACTGG 
TTTGTAAATG 
AATTTTTGTT 
ACATTTTCTC 
AATCCATTGA 
CTTTTGCAAT 
ACCCATTGAA 



31 



41 



GGAAGCGGGC 
CCATGGGGCT 
ACCACGTGCG 
GGCACAAGGA 
ATGAAAATAA 
AGAAGGGGGA 
ACATGATTGA 
TTGAGGCCAA 
CTCTTTGCAC 
TCAAACCCAA 
TAAACAAGCA 
AGGTTGTCAT 
CATTTACTGA 
CCATGGGATT 
CTGAGGCCAG 
GTGCTGCATC 
TTTCTGCATC 
ATAACTATAG 
GTGAGAAATA 
AGGAAGGCAT 
TGACACTGTT 
ATATTCAGTC 
TTGGATGGAG 
CCTATGTGGT 
TCATTCCACT 
TGCAGGGAAT 
GTTGTGGCAA 
TAGACACCAT 
CTTACCTTGA 
AGCTAATTAA 
TTATCGCAAA 
GCCTTATTTT 
GATCAGCATT 
TCTACAGAAA 
TGTGTATAAT 
AATTGATTAA 
GTAAAGTATT 
CTTGTACATT 
TACTGGTAAT 
CTTTTAAAGA 
TCGTTAATTT 
AAGTGCTTCA 
TGGAATAATC 
CTCTGAAAAA 



GACCGCCGTC 
GCTGTCCCAG 
GCGGCACGGG 
CGTTCTCAAG 
AAAAGTCCGG 
AAGGACAAAC 
AGGGACACCA 
CATGCGAAAA 
AATAACTTCA 
CCCAGTGGAA 
CCCTCGCTTC 
CAATGTACCA 
GGATGATGAA 
TGGAATGGGC 
ATACCTTTAT 
TCCCTTTTAC 
TGTAGATGAT 
GATCAGTAAA 
TAATGACATC 
TGATCAT CTC 
TGAAGAGAAA 
CACAAATTGG 
AGTAGAATTT 
GTTTGTGGTA 
GTCAAAGGTT 
GTTTTATTTC 
GGCCCAGAAC 
CATCAATGGG 
AAACATGGAA 
GAAGAGAGCA 
CCATCCTGAC 
GAAGTGTAAC 
TAGGAAAGTA 
GAAAAATGCA 
ATGAAGACCA 
GGCTTTCTTT 
TTTGATTAAC 
TTTAAATTCT 
TGTACAATAC 
CTACCTGGGA 
TCCTTTGTCA 
AGGGTAATCT 
ACTTGGTCAC 
AAAAAAAAAA 



51 

AGCCCGGAGG 60 

GGCTCGCCGC 12 0 

ATCCTCCAGT 180 

TGGGGCGATG 240 

TTGGTCCTGT 30 0 

CCAAACCATC 360 

GGACAGCCCT 420 

CGCCGGAAGG 480 

TTTCCCAGAT 540 

GGAGGAGCTT 600 

AGTACCTTAA 660 

ATATTTAAGG 72 0 

GCTTCAAGGG 780 

AATTGCTGTC 840 

GATCAGTTGG 900 

CGAGGCTATG 960 

AGAACT CGGG 102 0 

TCCCGATATG 1080 

GACTTGACGA 114 0 

CTGGCCCAGC 12 00 

ATACACCTGG 12 60 

CAGACAATGA 1320 

CGACCCATGG 13 8 0 

CTGCTCACCA 144 0 

G ATG AGAACA 150 0 

AGGAAAGAT A 1560 

AGCACGGAGC 1620 

AAGGAAGGTG 168 0 

GTGGATGTGG 1740 

TCTGGAGAAC 180 0 

TACAAGCAAG 1860 

CAAATTGCAA 192 0 

AAATATAGTG 1980 

TTATTGACGA 2040 

AATGATAGAA 210 0 

GGTAGGTAAA 2160 

AATGTATTTT 222 0 

TACTCTGGAG 22 8 0 

TTGCATTCCA 2340 

CCTGATTTAT 240 0 

TTTCCTTTGT 2460 

TGGGTTTCTA 2520 

CTTGCCCCAA 2580 
AAAA 



70 Seq ID NO: 294 Protein sequence:
Protein Accession #: NP_001489



75 



80 



85 



MGLLSQGSPL 
ENKKVRLVLS 
EANMRKRRKE 
NKHPRFSTIiT 
MGFGMGNCCIi 
SASVDDRTRE 
EGIDHLIiAQH 
GWRVEFRPME 
QGMFYFRKDI 
YLENMEVDVD 
LILKCNQIAN 



11 
I 

SWEETKRHAD 
GEKVL.ETLQE 
ATSILEENQA 
RNIRHRRGEK 
QVTFQACSIS 
ERGLEPLKNN 
VAHLFIRDPL 
VQLTDFENSA 
CKGGNAWDG 
TRCSILNYLK 
ELCECPELLG 



21 
I 

HVRRHGILQF 
KGERTNPNHP 
LCTITSFPRL 
WINVPIFKD 
EARYLYDOLA 
NYRI SKSRYD 
TLFEEKIHLD 
YWFWLLTR 
CGKAQNSTEL 
LIKKRASGEL 
SAFRKVKYSG 



31 
I 

LH I YHAVKDR 
TLWRPEYGSY 
GCPGFTLPEV 
KNTPSPFIET 
TICPIVMALS 
SIDSYLSKCG 
DANESDHFEN 
VILSYKLDFL 
AAEEYTLMS I 
MTVARWMREF 
SKTDSSN 



41 
i 

HKDVLKWGDE 
MIEGTPGQPY 
KPNPVEGGAS 
FTEDDEASRA 
AASPFYRGYV 
EKYNDIDLTI 
IQSTNWQTMR 
IPLSKVDENM 
DTIINGKEGV 
IANHPDYKQD 



51 

I 

VEYMLVSFDH 60 

GGTMSEFNTV 120 

KSLFFPDEAI 18 0 

SKPDH I YMDA 240 

SDIDCRWGVI 300 

DKEIYEQLLQ 3 60 

FKPPPPNSDI 42 0 

KVAQKRDAVL 480 

FPGLIPILNS 540 

SVITDEMNYS 600 



296 




297 



WO 02/086443 

TCAGCAAAGA TAGGATGATG CAGAAACCTG GTAGCAATGC ACCTGTGGGA GGAAACGTTA 

CCAGCAGTTT CTCTGGAGAT GACCTAGAAT GCAGAGAAAC AGCCTCCTCT CCCAAAAGCC 

AACAAGAAAT TAATGCTGAT ATAAAACGTA AATTAGTGAA GGAACTCCGA TGCGTTGGAC 

AAAAATATGA AAAAATCTTC GAAATGCTTG AAGGAGTGCA AGGACCTACT GCAGTCAGGA 

AACGATTTTT TGAATCCATC ATCAAGGAAG CAGCAAGATG TATGAGACGA GACTTTGTTA 

AGCACCTTAA GAAGAAACTG AAACGTATGA TTTGAGAATA CTTGTCCCTG GAGG AT TAT C 

ACACCCCAAA TGCATAATCT CATTAATGAT TGAGGAGAGA AAAGGATCAG ATTGCTGTTT 

TCTACAATGG AGCAGGATAT TGCTGAAGTC TCCTGGCATA TGTTACCGAA TCAACTGGCC 

TTCCAGAGGC TAAGAAATTT CTGTTAGTAA AAGATGTTCT TTTTCCCAAA GCGTTTTATT 

TGAAAGGATA ACTTGTGTTT TGGTTATTTT GTATTCCCAC CTGTGCTGGT AGATATTATT 

AACCCATTAG GTAAATACTA TTACAGTCGT GGTTTCTGCA 

Seq ID NO: 300 Protein sequence:
Protein Accession #: Eos sequence 

1 11 21 31 

1111 
MTDKTEKVAV DPETVFKRPR ECDSPSYQKR QRMALLARKQ 

GHAIPPSQLD SQIDDFTGFS KDRMMQKPGS NAPVGGNVTS 

EINADIKRKL VKELRCVGQK YEKIFEMLEG VQGPTAVRKR 

LKKKLKRMI 

Seq ID NO: 301 DNA sequence
Nucleic Acid Accession #: Eos sequence 
Coding sequence: 247-812 

1 11 21 31 41 51

II I I 1 I 
AGTGTTCGGC TGGGGCAGGC ACGCTGTGGC TGGCTACTTC CCTTCCTCCC ATCCCCCTTG 
GGCCAAACGG GATCGGTGCT TCTGGTGAGA CGCCTCCCCA TGCACATCAC TCCCAGGTGC 
CCTAGGGGGC ACATTTCCCA CAACTCCCAG AGGGCAGGTT TCTAGAAAGT GCCACCAGTG 
GGGAGGCGCC ACAACTTCAC TGCCATTTTG TGAGGTGCCG CCGTCTCTCC TCCAGCAAGG 
GAAACAATGA CCGATAAAAC AGAGAAGGTG GCTGTAGATC CTGAAACTGT GTTTAAACGT 
CCCAGGGAAT GTGACAGTCC TTCGTATCAG AAAAGGCAGA GGATGGCCCT GTTGGCAAGG 
AAACAAGGAG CAGGAGACAG CCTTATTGCA GGCTCTGCCA TGTCCAAAGA AAAGAGCTTA 
TGACAGGACA TGCTATTCCA CCCAGCCAAT TGGATTCTCA GATTGATGAC TTCACTGGTT 
TCAGCAAAGA TGGGATGATG CAGAAACCTG GTAGCAATGC ACCTGTGGGA GGAAATGTTA 
CCAGCAATTT CTCTGGAGAT GACCTAGAAT GCAGAGGAAT AGCCTCCTCT CCCAAAAGCC 
AACAAGAAAT TAATGCTGAT ATAAAATGTC AAGTAGTGAA GGAAATCCGA TGCCTTGGAC 
AATATGAAAA AATCTTCGAA ATGCTTGAAG GAGTGCAAGG ACCTACTGCA GTCAGGAAAC 
GATTTTTTGA ATCCATCATC AAGGAAGCAG CAAGATGTAT GAGACGAGAC TTTGTTAAGC 
ACCTTAAGAA GAAACTGAAA CGTATGATTT GAGAATACTT GTCCCTGGAG GATTATCACA 
CCCCAAATGC ATAATCTCAT TAATGATTGA GGAGAGAAAA GGATCAGATT GCTGTTTTCT 
ACAATGGAGC AGGATATTGC TGAAGTCTCC TGGCATATGT TACCGAATCA ACTGGCCTTC 
CAGAGG CTAA GAAATTTCTG TTAGTAAAAG ATGTTCTTTT TCCCAAAGCG TTTTATTTGA 
AAGGATAACT TGTGTTTTGG TTATTTTGTA TTCCCACCTG TGCTGGTAGA TAT TAT T AAC 
CCATTAGGTA AATACTATTA CAGTCGTGGT TTCTGCA 

Seq ID NO: 302 Protein sequence: 
Protein Accession #: Eos sequence 

1 11 21 31 

till 
MTDKTEKVAV DPETVFKRPR ECDSPSYQKR QRMALLARKQ 

GHAIPPSQLD SQIDDFTGFS KDGMMQKPGS NAPVGGNVTS 

EINADIKCQV VKEIRCLGQY EKI FEMLEGV QGPTAVRKRF 

KKKLKRMI 

Seq ID NO: 303 DNA sequence 
Nucleic Acid Accession #: Eos sequence 
Coding sequence: 247-815

1 11 21 31 41 51 

111111 
AGTGTTCGGC TGGGACAGGC ACGCTGTGGC TGGCTACTTC CCTTCCTTCC ATCCCCCTTG 

GGCCAAACAG GATCGGTGCT TCTGGTGAGA CGTCTCCCCA TGCACATCAC TCCCAGATGC 

CCTAGGGGGC ACATTTCCCA CAACTCCCAG AGGGCAGGTT TCTAGAAAGT GCCACCAGTG 

GGGAGGCGCC ACAACTTCAC TGCCATTTTG TGAGGTGCCG CCGTCTCTCC TCCAGCAAGG 

GAAACAATGA CCGATAAAAC AGAGAAGGTG GCTGTAGATC CTGAAACTGT GTTTAAACGT 

CCCAGGGAAT GTGACAGTCC TTCGTATCAG AAAAGGCAGA GGATGGCCCT GTTGGCAAGG 

AAACAAGGAG CAGGAGACAG CCTTATTGCA GGCTCTGCCA TGTCCAAAGC AAAGAGCTTA 

TGACAGGACA TGCTATTCCA CCCAGCCAAT TGGATTCTCA GATTGATGAC TTCACTGGTT 

TCAGCAAAGA TAGGATGATG CAGAAACCTG GTAGCAATGC ACCTGTGGGA GGAAACGTTA 

CCAGCAGTTT CTCTGGAGAT GACCTAGAAT GCAGAGAAAC AGCCTCCTCT CCCAAAAGCC 

AACAAGAAAT TAATGCTGAT ATAAAACGTA AATTAGTGAA GGAACTCCGA TGCGTTGGAC 

AAAAATATGA AAAAATCTTC GAAATGCTTG AAGGAGTGCA AGGACCTACT GCAGTCAGGA 

AACGATTTTT TGAATCCATC ATCAAGGAAG CAGCAAGATG TATGAGACGA GACTTTGTTA 

AGCACCTTAA GAAGAAACTG AAACGTATGA TTTGAGAATA CTTGTCCCTG GAGGATTATC 

ACACCCCAAA TGCATAATCT CGTTAATGAT TGAGGAGAGA AAAGGATCAG ATTGCTGTTT 

TCTACAATGG AGCAGGATAT TGCTGAAGTC TCCTGGCATA TGTTACCGAA TCAACTGGCC 

TTCCAGAGGC TAAGAAATTT CTGTTAGTAA AAGATGTTCT TTTTCCCAAA GCGTTTTATT 

TGAAAGGATA ACTTGTGTTT TGGTTATTTT GTATTCCCAC CTGTGCTGGT AGATATTATT 

AACCCATTAG GTAAATACTA TTACAGTCGT GGTTTCTGCA 

Seq ID NO: 304 Protein sequence: 
Protein Accession #: Eos sequence 



41 51 

1 1 
GAGDSLIAGS AMS KAKKLMT 

SFSGDDLECR ETASSPKSQQ 

FFESI IKEAA RCMRRDFVKH 



41 
I 

GAGDSLIAGS 
NFSGDDLECR 
FESIIKEAAR 



51 

I 

AMSKEKKLMT 
GIASSPKSQQ 
CMRRDFVKHL 
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65 



WO 02/086443 

1 11 21 31 41 51 

I I I I I I 

MTDKTEKVAV DPETVFKRPR ECDSPSYQKR QRMALLARKQ GAGD S L I AGS AMSKAKKLMT 

GHAIPPSQLD SQIDDFTGFS KDRMMQKPGS NAP VGGNVT S SFSGDDLECR ETASSPKSQQ 

EINADIKRKL VKELRCVGQK YEKIFEMLEG VQGPTAVRKR FFESIIKEAA RCMRRDFVKH 

LKKKLKRMI 

Seq ID NO: 305 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 87-689 



PCT/US02/12476 



1 



li 



i 



70 



CGTGGAGGCA 
CCAGACTAGC 
AGATGTCCGC 
CAGAGGTCCC 
TGTCCGGGAA 
AT CGGGAAAT 
CTCCCAAAAG 
AATCCACAAA 
AT AAT T T AAA 
AGT AT GAG AA 
CTGCTAAAGT 
AGGAGGAGGA 
TTAGAGTAGG 
ATTAGGTTTA 
AATTGTCAGT 
AAGTTGTACA 
CTGTGCACTT 
ATTTGTAAGG 
TATCTATAGT 
GCGTTGAGGC 
GAGGCTGGAC 
GTATATAGTG 
CATGAGAATA 
TAT AGAACT C 
CTCCTGTACT 
GAAATGTTTT 
AGTCAATTTC 
CTCCCTATAA 
TGAAGGAGAG 
ATGAAGT CTG 
AGGAAGGTGG 
CCTATTTTGT 
AAATTAAGGC 
ACATTATTTG 
AGTGAGGGTA 
TTGGAAACAC 
AGGGCAGGCT 
GCCTGCTCAT 
GAAGGAGCTT 
GTTGGGGTGA 
CTGATGTGTA 
GTGAGTGTTG 
CGCAGGAGTG 
GTTGAGAAAC 
TACGAGTTAT 
CATC AGAACT 
AAAACTCGGT 
GCCATGTCCT 
CTAGGCCAAG 
GGTCAAAAGG 
CAGGGAAGGG 
GTGGGGGAGC 
TGTCAAGTTG 
CACACTGTGG 
AAGTGGCATG 
TTCTTAAGAT 
CTACTCCCTC 
AGGCTGTGAT 
GTATTTGGGG 



GCTAGCGCGA 
GAACAATACA 
TTATGCCTTC 
TGTCAATTTT 
AGAGAAATCT 
GAAGGATTAT 
GCCACCGTCT 
CCCCGGCATC 
TGACAGTGAA 
GGATGTTGCT 
TGCCCGGAAA 
GGAGGAGGAG 
GGAGCGCCGT 
ATTACAAAAT 
GGTTTACATG 
TATTTCCAAA 
TGCTGTTGGT 
TGGTGGTAAC 
TTGTAAAAAG 
TGTGGGG AAG 
CTGTTGACTC 
ACATAGCATT 

1* 'J' IJI IJI IJI 

TTCATTGTCA 
TAAACACGAT 
TGAAGTTAAA 
TGACTCACAG 
ATGTGGTAGC 
GGCTACTTGA 
GAGGAGTTAG 
GTGATTAGGA 
GGGGCCAAAT 
CTTATTGTTT 
TGGTGCCCAA 
TGTGGGATGG 
CAAACACCCC 
AATGGAATCA 
AAGTTTAGCT 
GGTTTGTGTG 
GGGGAGATGG 
TATACATCAT 
CTATTGCCCA 
TTTTTGTGCT 
TTGCATGTCT 
GGTCACGGTC 
GTTTGTCCTG 
TGTGAGGTTT 
TGTCACTTGG 
ATTCGGGAGC 
GAGTGATTTG 
CCAAGGATGG 
AGTTTAGCCA 
AGGCCACTTG 
CAAGATTGCT 
ATGTTACCTA 
GCCAACCTGT 
TAACCACCTC 
GTAGTGACTA 
ACGTTGGATG 



21 

I 

GGCTGGGGAG 
GTCAGGATGG 
TTTGTGCAGA 
GCGGAATTTT 
AAATTTGATG 
GGACCAG CT A 
GGATTCTTCC 
TCTATTGGAG 
AAGCAGCCTT 
GACTATAAGT 
AAGGTGGAAG 
GATGAATAAA 
AATTGACACA 
TTGATCACGA 
AAGTGGCCAT 
CATT TTTAAA 
GTGACAAGGC 
TATGGTTATT 
AACAAAACAA 
ATGCCTTTTG 
TGCAGGGGGC 
CTGCTGCCAJT 
TAAGTGCGGT 
GCAAAGCAAA 
TCGCAACGTT 
TAAACAGTAT 
CAGTGAACAA 
TTCTTTTATT 
AGCTACTGTG 
GAGAACGACA 
CTGAGGCTAT 
GCATTGCTAA 
TTCTCTTTCA 
CATTTGGGGT 
GGTGGTGGGG 
AAGGAAGATG 
AC CAT T T CTG 
CATTCACTGG 
TCAGTGGTTA 
CCACAGTAGC 
TACTGTCCGT 
GCATTAATAT 
ATTAATTTTA 
GGAGGCGGTG 
ACAGCCTGAT 
AATGTGTTCC 
GCCCAGAGGC 
CATT CTAAGC 
TGTTGCCAGC 
TTAAGTGGTG 
AAAGGGGTAA 
GATGAT CTTT 
GTCCATTAGC 
CTTCTAGTGG 
AGGCTTAGGC 
TGCTTTTTTT 
ACCCCATTCT 
TTGTCTGTGT 
CATTCATTTT 



31 



41 



I 



CGCTGAGCCG 

CTAAAGGTGA 

CATGCAGAGA 

CCAAGAAGTG 

AAATGGCAAA 

AGGGAGGCAA 

TGTTCTGTTC 

ACGTGGCAAA 

ACATCACTAA 

CGAAAGGAAA 

AGGAAGATGA 

GAAACTGTTT 

TCTCTTATTT 

TCATATTGTA 

GGGTGTCTGG 

ATGAAAAGGC 

ATTTAAAGAT 

GGCTAGAAAT 

CCGAGACAAA 

GGAGAGGCTG 

ATCCATTTAG 

CTTAGCTGTG 

AGTTTTTAAA 

GAGTCACTGC 

CTGTTATTTT 

TACATTTTTA 

ACCCCCACTC 

ACTCAGTGGC 

TGATTTTGTT 

TAGGCAAGGT 

CTAGGTTTAA 

ACAGCAATTT 

CCCCTACCCC 

CTTGAGCCTG 

TAGGGGACGG 

ATAGGCTCCA 

AGCACTAAAT 

AAATGTAGAT 

TATTAGTGGG 

AAGTGGTGAC 

AGCAATGAAG 

TTGGGTGTGT 

AGAGAAAGCA 

TCCTCTCCGC 

CTCTTATGTG 

TCTAGT TCTA 

ACTTGTTCCA 

TAAAGCTTTA 

CTCGTCAAAT 

CGCGTCTATC 

CTTTTGTGCT 

GATTAGGCAA 

TGGGGCAGCA 

AATAATGCCC 

TTAGCTTGAT 

TTTTTTTTCC 

TGAATGACAT 

CTCCTGTGTG 

CTGTAATAAA 



CGCGTCGTGC 
CCCCAAGAAA 
AGAACATAAG 
CTCTGAGAGG 
GGCAGATAAA 
GAAGAAGAAG 
AGAATTCCGC 
AAAGCTGGGT 
GGCGGCAAAG 
GTTTGATGGT 
AGAAGAGGAG 
ATCTGTCTCC 
GAGAAGTGTC 
GTCTCTCAAA 
AGCACCCTGA 
ACTCTCGTGT 
GTTTCTGGCA 
CCTGAGTTTT 
CCCTTGATGC 
TAGCTCAGGG 
CTTCAGGTTG 
GACAAAGGGG 
CTGTTTGTTT 
ATCAATGAAA 
TTTTGTATGT 
AAACTCTTCT 
CATTGTATTT 
CAGCTCACTT 
TGTGTCTGAG 
TCAGCAGCCT 
CTTTTGTCCC 
CAGAGTGTAT 
CCGTGCTCCT 
CTGCTGGTCT 
TATCCTTTTT 
TCTTGGGCCA 
GTATCATGAA 
TGATGTTCAA 
TAGTGTAACA 
ACTAAATACC 
GATACAGTAC 
ATGTTTGAGG 
GCTTTTTCTT 
CCTGTCGGGT 
TTCATAGCCA 
GAAAATGACC 
GAATTTCCCC 
GCTT CCCAAT 
ATGGAAGAGA 
TCATAACTAG 
TCCAAAGTAG 
ACATTGAGTT 
AGAT CACT AC 
TAGTTTCTCT 
TTCTGGGCCC 
CCCATTTAAA 
TTTATCCTTC 
TGTCTGTTCT 
G 



51 
I 

CCTGCGCTGC 
CCAAAGGGCA 
AAGAAAAACC 
TGGAAGACGA 
GTGCGCTATG 
GATCCTAATG 
CCCAAGATCA 
GAGATGTGGA 
CTGAAGGAGA 
GCAAAGGGTC 
GAGGAAGAAG 
TTGTGAATAC 
TGTTGCCCTC 
GTGCTCTAGA 
AACTGTAT CA 
TCTCCTCACT 
TTTTCTTTTT 
CAACTGTATA 
TCCTTGCTCG 
CGTGCACTGT 
TCTTGTTTCT 
GGTCAGCTGG 
TTAAACAAAC 
GTTCAAGAAC 
TTAGAATGCT 
CTATTATAAC 
GGAGACTGGC 
AGGGCTGAGA 
TGGCATTCAG 
TCCAAGGTAT 
ACCTCCACCC 
GGTGTGTCAA 
GGCACAT AT C 
CCTGGATGCC 
TTGCTCCTAC 
CCTGAGCTAT 
AAGTTGAATG 
TGTTAAACTG 
TTTTATCCAG 
ATTTTGAAGG 
TGTGTTGTGG 
CTATGAAACA 
AAAATTCACT 
CCTGGATGAG 
TTCGCTCTCC 
ACTAATTTAA 
TCCTGCTTCA 
TCGTGATGTG 
AACAACCTGC 
ATGTACCAAC 
CTAAGCAGAA 
TTAAAGAGGC 
TCAACGTTTT 
GAGATGATGT 
ACTGTCTGTG 
AGGATAGTAC 
GGAAAGAACA 
TGTCACAAAT 



60 
120 
180 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 



75 



80 



Seq ID NO: 306 Protein sequence: 
Protein Accession #: NP_005333.1 

1 11 21 31 41 51 

I I I I I I 

MAKGDPKKPK GKMSAYAFFV QTCREEHKKK NPEVPVNFAE FSKKCSERWK TMSGKEKSKF 
DEMAKADKVR YDREMKDYGP AKGGKKKKDP NAPKRPPSGF FLFCSEFRPK IKSTNPGISI 
GDVAKKLGEM WNNLND SEKQ PYITKAAKLK EKYEKDVADY KSKGKFDGAK GPAKVARKKV 
EEEDEEEEEE EEEEEEEEDE 



60 
120 
180 



Seq ID NO: 307 DNA sequence 
85 Nucleic Acid Accession #: NM_022342 
Coding sequence: 1..2178 



299 



WO 02/086443 

1 11 21 31 41 51 

I I I I I I 

ATGGGTACTA GGAAAAAAGT TCATGCATTT GTCCGTGTCA AACCCACCGA TGACTTTGCT 60 

CAT G AAATG A TCAGATACGG AGATGACAAA AGAAGCATTG ATATTCACTT AAAAAAAGAC 120 

AT T CGG AG AG GAGTTGTCAA TAACCAACAG ACAGACTGGT CGTTTAAGTT GGATGGAGTT 180 

TTCACGATG CCTCCCAGGA CTTGGTTTAT GAGACAGTTG CAAAGGATGT GGTTTCTCAG 240 

CCCTCGATG GCTATAATGG CACCATCATG TGTTATGGGC AGACGGGAGC TGGCAAGACA 300 

ACACCATGA TGGGGGCAAC TGAGAATTAC AAGCACCGGG GGATCCTCCC TCGTGCCCTG 3 60 

AGCAGGTTT TTAGGATGAT CGAAGAACGC CCCACACATG CCATCACTGT GCGTGTTTCC 42 0 

ACTTGGAAA TCTATAATGA GAGCCTGTTT GATCTCCTGT CCACTCTGCC CTATGTTGGA 480 

CCTCAGTCA CACCAATGAC CATCGTGGAA AACCCTCAAG GAGTCTTCAT TAAGGGCTTG 540 

CAGTTCACC TCACAAGTCA GGAGGAGGAT GCATTCAGCC TCCTTTTTGA GGGTGAGACC 600 

ACAGGATTA TAGCCTCCCA CACTATGAAC AAAAACTCTT CCAGATCACA CTGCATTTTC 660 

CCATCTACT TAGAGGCCCA TTCCCGGACC TTATCAGAGG AAAAGTACAT CACTTCCAAA 72 0 

TTAACTTGG TGGATCTGGC AGGCTCAGAG AGGCTGGGGA AGTCTGGGTC TGAGGGCCAA 780 

TCCTGAAGG AAGCCACCTA CATCAACAAA TCGCTCTCAT TCCTGGAGCA GGCCATCATT 840 

CCCTTGGGG ACCAGAAGCG GGACCACATC CCCTTTCGGC AGTGCAAGCT CACCCACGCT 900 

TGAAGGACT CGTTAGGGGG AAACTGCAAT ATGGTCCTCG TGACAAACAT CTATGGAGAA 960 

CTGCCCAGT TAGAAGAAAC GCTATCTTGA CTGAGATTTG CCAGCAGGAT GAAGCTAGTC 102 0 

CCACTGAGC CTGCCATCAA TGAAAAGTAT GATGCTGAGA GAATGGT CAA GAACCTGGAG 1080 

AGGAACTAG CACTACTCAA GCAGGAG CTG GCTATCCATG ACAGCCTGAC CAACCGCACC 1140 

TTGTGACCT ATGACCCCAT GGATGAAATC CAGATTGCTG AGATCAACTC CCAGGTGCGG 120 0 

GGTACCTGG AGGGGACACT GGACGAGATC G ACATAAT CA GCCTTAGACA GATCAAGGAG 12 60 

TGTTCAACC AGTTCCGGGT GGTTCTGAGC CAACAGGAAC AGGAAGTGGA GTCCACTTTG 1320 

GCAGGAAGT ACACCCTCAT TGACAGGAAT GACTTTGCAG CCATTTCTGC TATCCAGAAG 1380 

CGGGGCTTG TGGATGTTGA TGGCCACCTA GTGGGTGAGC CTGAAGGACA AAACTTTGGA 1440 

TCGGAGTCG CCCCTTTCTC TACCAAACCT GGGAAGAAAG CCAAGTCCAA GAAGACATTC 1500 

AAGAGCCAC TCAGGCCCGA CACCCCACCC TCCAAACCAG TGGCCTTTGA GGAGTTTAAG 1560 

ATGAGCAAG GTAGTGAGAT CAACCGAATT TTCAAAGAAA ACAAATCCAT CTTGAATGAA 1620 

GGAGGAAAA GGGCCAGCGA GACCACACAG CACAT CAATG CC AT CAAGCG GGAGATTGAT 1680 

TGACCAAGG AGGCCCTGAA TTTCCAGAAG TCACTACGGG AGAAGCAAGG CAAGTACGAA 1740 

ACAAGGGGC TGATGATCAT CGATGAGGAA GAATTCCTGC TGATCCTCAA GCT CAAAGAC 1800 

TCAAGAAGC AGTACCGCAG CGAGTACCAG GACCTGCGTG ACCTCAGGGC TGAGAT CCAG 1860 

ATTGCCAGC ACCTAGTGGA TCAGTGTCGC CACCGCCTGC TCATGGAATT TGACATCTGG 192 0 

ACAATGAGT CCTTTGTCAT CCCTGAGGAC ATGCAGATGG CACTGAAGCC AGGCGGCAGC 1980 

TCCGGCCAG GCATGGTCCC TGTGAACAGG ATTGTGTCTC TGGGAGAAGA TGACCAGGAC 2040 

AATTCAGCC AGCTGCAGCA GAGGGTGCTT CCTGAGGGCC CTGATTCCAT CTCCTTCTAC 210 0 

ATGCCAAAG T CAAGATAG A GCAGAAGCAT AATTACTTGA AAACCATGAT GGGCCTCCAG 2160 
AGGCACATA GAAAATAG 

Seq ID NO: 308 Protein sequence: 
Protein Accession #: NP_071737 

1 11 21 31 41 51 

I l I l I l 

MGTRKKVHAF VRVKPTDDFA HEMIRYGDDK RSIDIHIiKKD IRRGWNNQQ TDWSFKLDGV 60 

LHDASQDIiVY ETVAKDWSQ ALDGYNGTIM CYGQTGAGKT YTMMGATENY KHRGILPRAL 120 

QQVFRMIEER PTHAITVRVS YLEIYNESLF DLLSTLPYVG PSVTPMTIVE NPQGVFIKGI) 180 

SVHIiTSQEED AFSLLFEGET NRIIASHTMN KNSSRSHCIF TIYLEAHSRT LSEEKYITSK 240 

INLVDLAGSE RLGKSGSEGQ VLKEATYINK SLSFLEQAII ALGDQKRDHI PFRQCKLTHA 300 

LKDSLGGNCN MVLVTNIYGE AAQLEETLSS LRFASRMKLV TTEPAINEKY DAERMVKNLE 360 

KELiALLKQEIj AIHDSLTNRT FVTYDPMDEI QIAEINSQVR RYLEGTLDEI DIISLRQIKE 420 

VFNQFRWTjS QQEQEVESTL RRKYTLIDRN DFAAISAIQK AGLVDVDGHL VGEPEGQNFG 480 

LGVAPFSTKP GKKAKSKKTF KEPLRPDTPP SKPVAFEEFK NEQGSEINRI FKENKSILNE 540 

RRKRASETTQ HINAIKREID VTKEADNFQK SLREKQGKYE NKGLMI IDEE EFLLILKLKD 600 

LKKQYRSEYQ DLRDLRAEIQ YCQHLVDQCR HRLLMEFDIW YNESFVIPED MQMALKPGGS 660 

IRPGMVPVNR IVSLGEDDQD KFSQLQQRVL PEGPDSISFY NAKVKIEQKH NYLKTMMGLQ 72 0 
QAHRK 

Seq ID NO: 309 DNA sequence 

Nucleic Acid Accession #: CAT cluster 

1 11 21 31 41 51 

I I I I I I 

TTTTTTTTTT TTTTTTTTAA TGCCTGCTGT CATGCTCTGT CTACCAGGGT GAATTTCCAA 60 

AAATTTCTGC ATAGCAATTT TAGCCAAAAC TATATATGTT CTGGGGAGGA TAGGCATAGG 12 0 

CACATTGAAG ACCAAAGGAA AGAGTGAAGA AGTGTAGTTG GGTCATTGTG AATGGATGTT 180 

TAGATTGTCA AGAAAAGTGG GCCAGAGGCC CCACCTCACA CTAGGACGGC AATTGCCTCT 240 

CATTAGTATC TCAGGCACCA TGGGTCT TAT TTGGTGTCAT AAGAAACACC CTCAACAAAG 300 

TAATGAACCC TCAGCCTCCA GCTTCTCTTC TTCGGGATTC TTCTTAGGGC CTCCTTTTTC 3 60 

CTTTTATGTT TCCAGTACCC TGAATTTCTT ATTCCCATCC CCCATTAAAA TCTGCTTCAA 42 0 

AGAAAAAACA AGAAGGACAC ATTCACTTTA AGATCCAAAT GAATGATAAG AGCTTAAAAC 480 
ATTATACTTA TCAGTATTAT TTGCATTTTT ATAGAAACCA AAACCATATT TCAACAAC 

Seq ID NO: 310 DNA sequence 

Nucleic Acid Accession #: NM_018622.2 

Coding sequence: 1-1140

1 11 21 31 41 51 

I I I I I i 

ATGGCGTGGC GAGGCTGGGC GCAGAGAGGC TGGGGCTGCG GCCAGGCGTG GGGTGCGTCG 60 
GTGGGCGGCC GCAGCTGCGA GGAGCTCACT GCGGTCCTAA CCCCGCCGCA GCTCCTCGGA 12 0 
CGCAGGTTTA ACTTCTTTAT TCAACAAAAA TGCGGATTCA GAAAAGCACC CAGGAAGGTT 180 
GAACCTCGAA GATCAGACCC AGGGACAAGT GGTGAAGCAT ACAAGAGAAG TGCTTTGATT 240 
CCTCCTGTGG AAGAAACAGT CTTTTATCCT TCTCCCTATC CTATAAGGAG TCTCATAAAA 300 
CCTTTATTTT TTACTGTTGG GTTTACAGGC TGTGCATTTG GATCAGCTGC TATTTGGCAA 3 60 



300 



10 



15 



WO 02/086443 

TATGAATCAC TGAAAT CCAG 
GAT AG C AT AA GACCACAAAA 
AACCTAAGTG ATGGCCAGCG 
TGTTTATGGA GAGTACCTTC 
GCCTCAAAGG TCCTTTGTTC 
CACATGGCAG CAAATATGTA 
GGTCAAGAGC AGTTCATGGC 
TACCTGGGTA AAGTTGCCAC 
ATGACAGTCC TCGCAGCTGT 
CTTCCGATGT TCACGTTCAC 
GCAGGAATGA TCCTGGGATG 
TTTGGAATAT GGTATGTTAC 
GTGAAAATCT GGCATGAAAT 



PCT/US02/12476 



GGTCCAGAGT 
AGAAGGAGAC 
GACTGTGACA 
TCTGCAGCGG 
TCCAATGTTG 
TGTTTTGTGG 
AGTGTACCTA 
AGGAAGATAT 
CTGCACTAAG 
AGCAGGGAAT 
GAAATTTTTT 
TT ACGGT CAT 
AAGGACTAAT 



TATTTTGATG 
TTCAGAAAGG 
GGTATTATAG 
ACAATGATCA 
CTGTCAACAT 
AGCTTCTCTT 
TCTGCAGGTG 
GGACCATCAC 
ATCCCAGAAG 
GCCCTGAAAG 
GATCATGCGG 
GAACTGATTT 
GGCCCCAAAA 



GTATAAAAGC 
AGATTAACAA 
CTGCAAATGT 
GATATTTCAC 
TCAGTCACTT 
CCAG CATAGT 
TTATTTCCAA 
TTGGTGCATC 
GGAGGCTTGC 
CCATTATCGC 
CACATCTTGG 
GGAAGAACAG 
AAGGAGGTGG 



TGATTGGTTG 42 0 

GTGGTGGAAT 480 

CCTTGTATTC 540 

AT CGAATCCA 60 0 

CTCCTTATTT 660 

GAACATTCTG 720 

TTTTGTCAGT 780 

TGGTGCCATC 840 

CATTATTTTC 90 0 

CATGGATACA 960 

GGGAGCTCTT 102 0 

GGAGCCGCTA 1080 
CTCTAAGTAA 



Seq ID NO: 311 Protein sequence: 
Protein Accession #: NP_061092.2



20 



25 



30 



I 

MAWRGWAQRG 
EPRRSDPGTS 
YESLKSRVQS 
CLWRVPSLQR 
GQEQFMAVYL 
LPMPTFTAGN 
VKIWHEIRTN 



11 

I 

WGCGQAWGAS 
GEAYKRSALI 
YFDGIKADWL 
TMIRYFTSNP 
SAGVISNFVS 
ALKAI I AMDT 
GPKKGGGSK 



21 
I 

VGGRSCEELT 
PPVEETVFYP 
DSIRPQKEGD 
ASKVLCSPML 
YLGKVATGRY 
AGMILGWKFF 



31 
i 

AVLTPPQLLG 
SPYPIRSLIK 
FRKEINKWWN 
LSTFSHFSLF 
GPSLGASGAI 
DHAAHLGGAL 



41 
I 

RRFNFFIQQK 
PLFFTVGFTG 
NLSDGQRTVT 
HMAANMYVLW 
MTVLAAVCTK 
FGIWYVTYGH 



51 
I 

CGFRKAPRKV 60 

CAFGSAAIWQ 12 0 

GIIAANVLVF 180 

SFSSSIVNIL 240 

IPEGRLAI IF 300 

EIiIWKNREPL 3 60 



Seq ID NO: 312 DNA sequence 
Nucleic Acid Accession #: NM_000625
Coding sequence: 195..3656



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



CTCTCGGCCA 
CACAGGTCTC 
GCCCCACAGT 
GTAAAGCCAT 
ATGCAATGAA 
CCAGTCCAGT 
CCCCGCAGCC 
CAACCCCATT 
TCCAAGACAC 
TGGGGTCCAT 
CAGATGAGCT 
AGGCAAAAAT 
CAGTAACCTA 
ATGCCCCACG 
GCTGTTCCAC 
ACAATGGCAA 
ACTTCCGGGT 
GCATCAGAGG 
AGCCCAAGTA 
CTGAGCTCTT 
ACGAGTGGTT 
TGCTTGAGGT 
CAGAGATCGG 
GCAGGAGAAT 
TTGAGATCAA 
ACCACTCGGC 
GCTGCCCGGC 
TTCACCAGGA 
GGAAAACCCA 
AAGTCTTGGT 
GAGTCAGAGT 
ACCTGGGGGC 
GGCTGAGCTG 
GAGACTGCCC 
ACAACAAATT 
CCTTTGCTCA 
TGGGAGAAGG 
CCTTCAAGGC 
AGCTCTACAC 
AGCCTTTGGA 
GGCTCAAATC 
AACTCTCCTG 
GCCCAGGCAA 
CACCCCACCA 
ACAAGAGGCT 
CACCCCCAAC 
GACAGAGGCT 
GCCCCACATT 
TGCTTTCCCA 
ACACGCCCAC 
AGGGTCCCCT 
CAGTGCCCTG 



11 

I 

CCTTTGATGA 
TTCCTGGTTT 
GAAGAACATC 
AGAGATGGCC 
TGGGGAAAAA 
GACACAGGAT 
CCTCGTGGAG 
GTCCTCCCCA 
ACTTCACCAT 
TATGACTCCC 
TCTACCTCAA 
AGAGGAACAT 
CCAACTGACG 
CTGCATTGGG 
TGCCCGGGAA 
CATCAGGTCG 
GTGGAATGCT 
GGACCCTGCC 
CGGCCGCTTC 
CGAAATCCCA 
TCGGGAACTG 
GGGCGGCCTG 
AGTCCGGGAC 
GGGCCTGGAA 
CATTGCTGTG 
TGCAGAATCC 
AGACTGGATT 
GATGCTGAAC 
TGTCTGGCAG 
CAAAGCTGTG 
CACCATCCTC 
CTTATTCAGC 
CCTGGAGGAG 
TGGCAATGGA 
CAGGTACGCT 
TGACATTGAT 
GGATGAGCTC 
AGCCTGTGAG 
CTCCAATGTG 
CCTCAGCAAA 
TCGGCAGAAT 
TGAGGATGGC 
CCAGCCGGCC 
GGCAGTGCGC 
GCCCCCCTGC 
CCAGCTGCTG 
GGAGGCCCTG 
CCTGGAGGTG 
GCTCCCCATT 
GGAGATCCAC 
GCACCACGGC 
CTTTGTGCGG 



21 



31 



GGGGACTGGG 
GACTGTCCTT 
TGAGCTCAAA 
TGTCCTTGGA 
GGCATCAACA 
GACCTTCAGT 
ACGGGAAAGA 
CGGCATGTGA 
AAGGCCAAAG 
AAAAGTTTGA 
GCTATCGAAT 
CTGGCCAGGG 
GGAGATGAGC 
AGGAT CCAGT 
ATGTTTGAAC 
GCCATCACCG 
CAGCTCATCC 
AACGTGGAAT 
GATGTGGTCC 
CCTGACCTTG 
GAGCTAAAGT 
GAGTTCCCAG 
TTCTGTGATG 
ACGCACAAGC 
CTCCATAGTT 
TTCATGAAGT 
TGGCTGGTCC 
TACGTCCTGT 
GACGAGAAGC 
CTCTTTGCCT 
TTTGCGACAG 
TGTGCCTTCA 
GAACGGCTGC 
GAGAAACTGA 
GTGTTTGGCC 
CAGAAGCTGT 
AGTGGGCAGG 
ACGTTTGATG 
ACCTGGGACC 
GCCCTCAGCA 
CTACAAAGTC 
CAAGGCCTGA 
CTGGTCCAAG 
CTGGAGGCCC 
TCACTCAGCC 
CTCCAAAAGC 
TGCCAGCCCT 
CTAGAGGAGT 
CTGAAGCCCA 
CTGACTGTGG 
GTCTGCAGCA 
AATGCCAGCG 



CAGTTCTAGA 
ACCCCGGGGA 
TCCAGATAAG 
AATTTCTGTT 
ACAATGTGGA 
ATCACAACCT 
AGTCTCCAGA 
GGATCAAAAA 
GGATTTTAAC 
CCAGAGGACC 
TTGTCAACCA 
TGGAAGCGGT 
TCATCTTCGC 
GGTCCAACCT 
ACATCTGCAG 
TGTTCCCCCA 
GCTATGCTGG 
TCACTCAGCT 
CCCTGGTCCT 
TGCTTGAGGT 
GGTACGCCCT 
GGTGCCCCTT 
TCCAGCGCTA 
TGGCCTCGCT 
TCCAGAAGCA 
ACATGCAGAA 
CTCCCATGTC 
CCCCTTTCTA 
GGAGACCCAA 
GTATGCTGAT 
AGACAGGAAA 
ACCCCAAGGT 
TGTTGGTGGT 
AGAAATCGCT 
TCGGCTCCAG 
CCCACCTGGG 
AGGACGCCTT 
TCCGAGGCAA 
CGCACCACTA 
GCATGCATGC 
CGACATCCAG 
ACTACCTGCC 
GCATCCTGGA 
TGGATGAGAG 
AGGCCCTCAC 
TGGCCCAGGT 
CAGAGTACAG 
TCCCGTCCCT 
GGTTCTACTC 
CCGTGGTCAC 
CATGGCTCAA 
GCTTCCACCT 



41 

I 

CAGTCCCGAA 
GGCAGTGCAG 
TGACATAAGT 
CAAGACCAAA 
GAAAGCCCCC 
CAGCAAGCAG 
ATCTCTGGTC 
CTGGGGCAGC 
TTGCAGGTCC 
CAGGGACAAG 
ATATTACGGC 
AACAAAGGAG 
CACCAAGCAG 
GCAGGTCTTC 
ACACGTGCGT 
GCGGAGTGAT 
CTACCAGATG 
GTGCATCGAC 
GCAGGCCAAT 
GGCCATGGAA 
GCCTGCAGTG 
CAATGGCTGG 
CAACATCCTG 
CTGGAAAGAC 
GAATGTGACC 
TGAATACCGG 
TGGGAGCATC 
CTACTATCAG 
GAGAAGAGAG 
GCGCAAGACA 
ATCAGAGGCG 
TGTCTGCATG 
GACCAGTACG 
CTTCATGCTG 
CATGTACCCT 
GGCCTCTCAG 
CCGCAGCTGG 
ACAGCACATT 
CAGGCTCGTG 
CAAGAACGTG 
CCGTGCCACC 
GGGGGAGCAC 
GCGAGTGGTG 
TGGCAGCTAC 
CTACTTCCTG 
GGCCACAGAA 
CAAGTGGAAG 
GCGGGTGTCT 
CATCAGCTCC 
CTACCACACC 
CAGCCTGAAG 
CCCCGAGGAT 



51 

1 

GTTCTCAAGG 60 

CCAGCTGCAA 12 0 

GACCTGCTTT 180 

TTCCACCAGT 240 

TGTGCCACCT 3 0 0 

CAGAATGAGT 3 60 

AAGCTGGATG 42 0 

GGGATGACTT 480 

AAATCTTGCC 54 0 

CCTACCCCTC 60 0 

TCCCTCAAAG 660 

ATAGAAACAA 72 0 

GCCTGGCGCA 7 80 

GATGCCCGCA 840 

TACTCCACCA 90 0 

GGCAAGCACG 960 

CCAGATGGCA 102 0 

CTGGGCTGGA 1080 

GGCCGTGACC 1140 

CATCCCAAAT 12 00 

GCCAACATGC 12 60 

TACATGGGCA 1320 

GAGGAAGTGG 13 80 

CAGGCTGTCG 1440 

ATCATGGACC 150 0 

TCCCGTGGGG 1560 

ACCCCCGTGT 162 0 

GTAGAGGCCT 1680 

ATTCCATTGA 1740 

ATGGCGTCCC 1800 

CTGGCCTGGG 1860 

GAT AAGT ACA 192 0 

TTTGGCAATG 1980 

AAAGAGCTCA 2040 

CGGTTCTGCG 210 0 

CTCACCCCGA 2160 

GCCGTGCAAA 222 0 

CAGATCCCCA 22 80 

CAGGACTCAC 2 34 0 

TTCACCATGA 240 0 

ATCCTGGTGG 2460 

CTTGGGGTTT 2520 

GATGGCCCCA 2580 

TGGGTCAGTG 2 640 

GACATCACCA 2700 

GAGCCTGAGA 2 760 

TTCACCAACA 2 82 0 

GCTGGCTTCC 2880 

CCCCGGGATC 2 940 

CGAGATGGCC 30 00 

CCCCAAGACC 3 060 

CCCTCCCATC 312 0 



301 



10 



15 



WO 02/086443 

CTTGCATCCT CATCGGGCCT 
GGCTCCATGA CTCCCAGCAC 
GCCGCCGCCC AGATGAGGAC 
GGGTGCTGCA TGCGGTGCAC 
TTCAGGACAT CCTGCGGCAG 
CAGGCCACCT CTATGTTTGC 
AGCAGCTGGT GGCTGCCAAG 
AGCT CAAGAG CCAGAAGCGC 
CGAAGAAGGA CAGGGTGGCG 
CTACAGGAGG GGTTAAAGCT 
CTGAGGTCAC AGGGCCTGGG 
TTCCTCAACG TTGCTCCCCA 
ATTGATCGGA GCCTC 



PCT/US02/12476 



GGCACAGGCA 
AAGGGAGTGC 
CACATCTACC 
ACAGCCTATT 
CAGCTGGCCA 
GGGGATGTGC 
CTGAAATTGA 
TAT CACGAAG 
GTGCAGCCCA 
GCCGGCACAG 
GAGATGGAGG 
TCAAGCCCTT 



TCGCGCCCTT 
GGGGAGGCCG 
AGGAGGAGAT 
CCCGCCTGCC 
GCGAGGTGCT 
GCATGGCCCG 
ATGAGGAGCA 
AT AT CTTTGG 
GCAGCCTGGA 
AACTTAAGGA 
AAAGTGATAT 
TACTTGACCT 



CCGCAGTTTC 
CATGACCTTG 
GCTGGAGATG 
TGGCAAGCCC 
CCGTGTGCTC 
GGACGTGGCC 
GGT CGAGGAC 
TGCTGTATTT 
GATGT CAGCG 
TGGAGCCAGC 
CCCCCAGCCT 
CCTAACAAGT 



TGGCAGCAAC 3180 

GTGTTTGGGT 3240 

GCCCAGAAGG 3300 

AAGGTCTATG 33 60 

CACAAGGAGC 3420 

CACACCCTGA 3480 

TATTTCTTTC 3540 

CCTTACGAGG 3600 

CTCTGAGGGC 3660 

TCTGCATTAT 372 0 

CAAGTCTTAT 3780 

AGCACCCTGG 3840 



Seq ID NO: 313 Protein sequence: 
Protein Accession #: NP_000616 



20 



25 



30 



35 



40 



MACPWKFLFK 
VETGKKSPES 
TPKSLTRGPR 
LTGDELI FAT 
RSAITVFPQR 
RFDWPLVLQ 
GLEFPGCPFN 
AVLHSFQKQN 
LNYVLtSPFYY 
ILFATETGKS 
NGEKLKKSLF 
ELSGQEDAFR 
SKALSSMHAK 
PALVQGILER 
LLLQKLAQVA 
PILKPRFYSI 
VRNASGFHLP 
EDHIYQEEML 
V CGD VRMARD 
VAVQPSSLEM 



11 
I 

TKFHQYAMNG 
LVKLDATPLS 
DKPTPPDELL 
KQAWRNAPRC 
SDGKHDFRVW 
ANGRDPELFE 
GWYMGTE I GV 
VTIMDHHSAA 
YQVEAWKTHV 
EALAWDLGAL 
MLKELNNKFR 
SWAVQTFKAA 
NVFTMRLKSR 
WDGPTPHQA 
TEEPERQRLE 
SSPRDHTPTE 
EDPSHPCILI 
EMAQKGVLHA 
VAHTLKQLVA 
SAL 



21 
I 

E KG I NNNVEK 
SPRHVRIKNW 
PQAIEFVNQY 
IGRIQWSNLQ 
NAQLIRYAGY 
IPPDLVDEVA 
RDFCDVQRYN 
ESFMKYMQNE 
WQDEKRRPKR 
FSCAFNPKW 
YAVFGLGSSM 
CET FDVRGKQ 
QNLQSPTSSR 
VRLEALDESG 
ALCQPSEYSK 
IHLTVAWTY 
GPGTGIAPFR 
VHTAYSRLPG 
AKLKLNEEQV 



31 
1 

APCATSSPVT 
GSGMTFQDTL 
YGSLKEAKIE 
VFDARSCSTA 
QMPDGSIRGD 
MEHPKYEWFR 
I LEEVGRRMG 
YRSRGGCPAD 
REIPLKVLVK 
CMDKYRIiSCL 
YPRFCAFAHD 
HIQIPKLYTS 
ATILVELSCE 
SYWVSDKRLP 
WKFTNSPTFL 
HTRDGQGPLH 
SFWQQRLHDS 
KPKVYVQD I Ii 
EDYFFQLKSQ 



41 



QDDLQYHNLS 
HHKAKG I LTC 
EHLARVEAVT 
REMFEHICRH 
PANVEFTQLC 
ELELKWYALP 
LETHKLASLW 
WIWLVPPMSG 
AVLFACMLMR 
EEERLIjIjWT 
IDQKLSHLGA 
NVTWDPHHYR 
DGQGLNYLPG 
PCSLSQALTY 
EVLEEFPSLR 
HGVCSTWLNS 
QHKGVRGGRM 
RQQLASEVLR 
KRYHEDI FGA 



51 
I 

KQQNESPQPL 60 

RSKSCLGSIM 120 

KEIETTVTYQ 180 

VRYSTNNGNI 240 

IDLGWKPKYG 3 00 

AVANMLLEVG 360 

KDQAWEINI 42 0 

SITPVFHQEM 480 

KTMASRVRVT 540 

STFGNGDCPG 600 

SQLTPMGEGD 660 

LVQDSQPLDL 720 

EHLGVCPGNQ 780 

FLDITTPPTQ 840 

VSAGFLLSQL 90 0 

LKPQDPVPCF 960 

TLVFGCRRPD 102 0 

VLHKEPGHLY 1080 

VFPYEAKKDR 1140 
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Seq ID NO: 314 DNA sequence 
Nucleic Acid Accession #: XM_087254 
Coding sequence: 47..2332



50 



55 



60 



65 



70 



75 



80 



85 



AGAGTACGTG 
ATGTTCAATT 
AACACCAGAC 
CTTATCCCAT 
AATTAAAGAA 
CAATGTTCAA 
GTTGGAGTAC 
TGGTATTGTG 
GGAACGGTAC 
AATTGTTCAG 
TCTCCCTAAA 
TTTGAAAGGG 
GGAAATAGAT 
GGCAGCTGTT 
AGACAGACTA 
AGTATGGGTA 
CCATTTTCAT 
TGCTGAACAA 
GCTGGTAGTG 
GGAAGTTTGC 
AAAAGTAATA 
TGGTGCTAAT 
AGAAGGAAGA 
CAAATTGCTT 
TTTTTTTTAT 
GTTTTCTCAG 
TTCCCTACCT 
AAATAAGCCC 
TCTTTATTGG 
ACTAATAGGG 
TGGCACTTTG 
TCATTTTTGG 
ATTTTCCTTG 
TGTGTTTATT 
TACATGTCTA 
TACTGAAAAG 
CTGTTTCCCG 
AGGAAGATGT 
CAACGACAGG 



11 

I 

TTTACAGATA 
AATGGCATGA 
TCTTCAGAAG 
CTTACAACCA 
CATGATCTCT 
ACTGACTGCA 
TATGCATCTT 
TTTATTGGCA 
AAACTGCTTC 
GCACCTTCAG 
TGTATAGGTG 
CTAAGAACTC 
AAACGCATAT 
TTCCAGTTCA 
CAAGATAAAG 
CTTACTGGGG 
AGAACCATGA 
TTGAGGCAGC 
GATGGGACCA 
AGAAATTGTT 
AGACTAATAA 
GACGTAAGCA 
CAGGCTGCAA 
TTTGTTCATG 
AAGAATGTGT 
CAAACATTGT 
ATTCTGATAT 
ACCCTTTATC 
ACCATCCTGG 
AAAGATACAT 
GTCTTCACAG 
ACTTGGATCA 
TTTTATGGAG 
CAGCTCCTGT 
TTTCTTGATA 
GCACAGCTTA 
GAAGGAGAAG 
AGTCCAACCC 
AGCATCTTGA 



21 



AAACTGGTAC 
AATACCAAGA 
GAAACTTATC 
GTTCCTCTTT 
TCTTTAAAGC 
CTGGTGATGG 
CACCAGATGA 
ATTCTGAAGA 
ATATTCTGGA 
GTGAGAAGTT 
GAGAAATAGA 
TGTGTATAGC 
TTGAAGCCAG 
TAGAGAAAGA 
TTCGAGAAAC 
ATAAACATGA 
ACATCCTTGA 
TTGCCAGAAG 
GCCTATCTCT 
CAGCTGTATT 
AAATATCACC 
TGATACAAGA 
GAAACAGTGA 
GTCATTTTTA 
GCTTTATCAC 
ATGACAGCGT 
ATAGTCTTTT 
GAGACATTAG 
GCTTCAGTCA 
CTCTGCTTGG 
T CATGGTT AT 
ACCATCTCGT 
GGATTCTCTG 
CAAGTGGTTC 
TCATAAAGAA 
CTGAAACAAA 
CAGCGTGTGC 
ACATCAGCAG 
CTCTCTCCAC 



31 

1 

ACTGACAGAA 
AATTAATGGT 
TTATCTTAGT 
CAGAACCAGT 
AGTCAGT CTC 
TCCCTGGCAA 
AAAGGCTCTA 
AACTATGGAG 
ATTTGATTCA 
ATTATTTGCT 
AAAAACCAGA 
ATATAGAAAA 
GACTGCCTTG 
CCTGATATTA 
TATTGAAGCA 
AACAGCTGTT 
ACTTATAAAC 
AATTACAGAG 
TGCACTCAGG 
ATGCTGTCGT 
TGAGAAACCT 
AGCCCATGTT 
CTATGCAATA 
TTATATTAGA 
ACCCCAGTTT 
GTACCTGACT 
GGAACAGCAT 
TAAAAACCGC 
TGCCTTTATT 
AAATGGCCAG 
TACAGTCACA 
TACCTGGGGA 
GCCATTTTTG 
TGCTTGGTTT 
GGTCTTTGAC 
TGCAGGTATC 
ATCTGTTGGA 
ATCATGGAGT 
AATGGACTCA 



41 



51 



AATGAGATGC 
AGACT TGTAC 
AGTTTATCCC 
CCTGAAAATG 
TGTCACACTG 
TCCAACCTGG 
GTAGAAGCTG 
GTTAAAACTC 
GATCGTAGGA 
AAAGGAGCTG 
ATTCATGTAG 
TTTACATCAA 
CAGCAGCGGG 
CTTGGAGCCA 
TTGAGAATGG 
AGTGTGAGTT 
CAGAAATCAG 
GATCATGTGA 
GAGCATGAAA 
ATGGCTCCAC 
ATAACATTGG 
GGCATAGGAA 
GCCAGATTTA 
ATAGCTACCC 
TTATATCAGT 
TTATACAATA 
GTAGACCCTC 
CTCTTAAGTA 
TTCTTTTTTG 
ATGTTTGGAA 
GTAAAGATGG 
TCTATTATAT 
GGCTCCCAGA 
GCCATAATCC 
CGACACCTCC 
AAGTGCTTGG 
AGAATGCTGG 
GCATCGGATC 
TCTACTTGTT 



AGTTT CGGG A 60 

CCGAAGGACC 12 0 

ATCTTAACAA 180 

AAACTGAACT 240 

TACAGATTAG 3 00 

CACCATCGCA 3 60 

CTGCAAGGAT 42 0 

TTGGAAAACT 480 

GAATGAGTGT 540 

AGTCAT CAAT 600 

ATGAATTTGC 660 

AAGAGTATGA 720 

AAGAGAAATT 780 

CAGCAGTAGA 840 

CTGGTATCAA 900 

TATCATGTGG 960 

ACAGCGAGTG 1020 

TTCAGCATGG 10 80 

AACTATTTAT 1140 

TGCAGAAAGC 12 0 0 

CTGTTGGTGA 12 60 

TCATGGGTAA 132 0 

AGTTCCTCTC 13 80 

TTGTACAGTA 1440 

TCTACTGTTT 1500 

TTTGTTTTAC 1560 

ATGTGTTACA 162 0 

TTAAAACATT 1680 

GATCCTATTT 1740 

ACTGGACATT 1800 

CTCTGGAAAC 1860 

TTTATTTTGT 192 0 

ATATGTATTT 1980 

TCATGGTTGT 2 040 

ACCCTACAAG 2100 

ACTCCATGTG 2160 

AACGAGTTAT 222 0 

CTTTCTATAC 2280 

AAAGGGG CAG 23 40 
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20 
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TAGTACTTTG TGGGAGCCAG 
ATGGCCACAC TAGCTCTGAA 
GAGTTATAAT GGCAAACAAA 
TGAATCTGAA CATGTTAAAA 
TGTCCCTTGT GCTTATGGGA 
TTTAATATAA ATGTAGAAAA 
TTGATTATTG ACTCTTCTAT 
AGAACTCTAT TTTTTTATTA 
ATACTGAGGA ATTTTGGTCC 
TTCACAGAGC AAATTAGGAG 
ATTTATACCA ATTCCTCTAA 
CAAGGGTATA TCATATATAC 
GTTTACTAAT ATTTTTGTGA 
TAGCATATTA TTAATTTAAT 
ACATATTTAA ATTTGCTTTT 
CATCGTTGTA CAGTTTAACT 
TATGT TTAAT TATACAAATC 
CTCTTTCTGC AGCCGACTTA 
AGGGTTT CAG TTAATAATCT 
CAATACAGTG AGTTCTGCCA 
TGTAAAAATG CTCAACTTGT 
TAATCGGGTA CATGTTACTG 
AATTTATCAA GTAGTT CAGT 
TTAAGATTTA GAAGTGATTA 
TTGTATACAT ATTAAGATAA 
AATTCCTTTA TGGAGATTTA 
GGCTTCTAGA ATTGGACTGG 
CTTGTTTGCT TGTAAACTAT 
TAAGGATATT AAGTTATTAA 
GATATTTCAT AGCTGGATTT 
CAACGTACAA TGTCTGCATT 
CTCAGTAGAG TACTAGGTGG 
TGCATATAAC AAAATGACAC 
G CC ATCAAAT AAACTGAGTA 
TGACCAACTG CAGCAAGACA 
ATGTAATTTT CTGTACT C AC 
AAGTAAATGG CAACCACTAG 
TTAAAGCAAA ATTATCTTGT 
CAATG CAGT C TGCAAGCTTT 
ACTACGTAAC CAGTAATCAC 
CTTTGGAAAG TATGATGTTG 
GCTAAATACG TTATTGCTAA 
GAGGGCTGTA AGCCTGAAGA 
GCTGCTTTAA GTGACTCAGC 
GGAGCAAAGT ATGGGCCAGG 
AGGGGAGAAT TTATGGTCTG 
ATACACAAAG GCTTCCAGAC 
CAGAGGCAAA TCAACCCTAG 
AGGTCATTTC TACTGGAAAA 
ATAGGCAGGA GTCAAGGCCA 
TGCTACTCTG AAAAATCTCG 
TTTTCCTGTA AAGATCAGTT 
CAAAGAGTTA CGTAAAACAT 
CTATTTTGAA ATGAGTTATC 
TGTGAAATAA CTTGAATGTT 
AATCATGGTA ATTTAGATTT 
GGTTTAAAAT TTTGGACCTG 
TGCATTGTCA GTAAATGTAG 
GAAGTTATAT TT ATCAAAT A 



TTCACCTCCT 
ATTAATTTCC 
CAGAAAGCAT 
TTTGAGAATA 
CTCCTAATGG 
AAGAGAGAAA 
TTAAATCTGC 
GAGTTATATT 
CTCAGTGACC 
AATCATTTCC 
CTGTACTGTA 
AAATCAGGAA 
CAGAGTATAA 
GTCTTTATCA 
TTTCTCTTTA 
ATATCAATAA 
AGAATAGTAT 
GACATGCTCT 
TATTTTCAGG 
GTGTCCCAGT 
ATCAGGTAAT 
TAATTAACTC 
ATTGTCATTT 
TTAGCTTGAG 
TGGTTAAATG 
TTGTGCAGCC 
CAGGGGAAAG 
TATTTTCTTG 
GCTAAATATT 
AGGAAGATCT 
CACTAATTCA 
GAGGATATGG 
CCAGTAGGCC 
CTGACACCAG 
GGAGGTCAGC 
CATTTGAAGT 
TGTGCTCATC 
GATTTTAAGA 
CAGTAGTTTT 
AAGGAAAGTG 
ATAATTAACT 
TCAGTGGTCT 
TAGTGGCAAG 
ACCCTGCCTC 
GAGAACTACA 
AATTTTCTAA 
CTGAGCCACA 
GAAATACTTG 
GATTGTGAGA 
CTAGAAAATT 
TGAAGGCTGT 
TGGGGTATGA 
GTTTTATTAA 
TATTTTCATA 
GTTCCTATAA 
TTATGAGGAA 
AGACACTGTG 
TATATTATTG 
AAAACTTTCC 



TTCCTAAAAT 
AAAATCTTTG 
TAGTACAAGC 
AAGAGACATT 
CATTTCAGTC 
TCTTAGTAAA 
TTCTGTAAAT 
TAAAGCTTTT 
TGTGTTGTTA 
AACCATTATT 
ACACAGCCTG 
TCAGGTCCGT 
AGACCCTATA 
TTGGATCTTT 
CCTGAAGGCT 
AAAGTTTGGA 
GGGTAATTAA 
TCCCTTTCTA 
TTATGTCATC 
ACAAGGCATA 
GTTAGCAATA 
ATTGCACTTC 
GTTTTTGTTT 
AACTATTACC 
CGGTTTTACC 
CTAAGCTTCC 
AATGGTAGAG 
CTAATGTAAC 
AATTTTCAAA 
GTTATTCTGG 
TGTTCCAGAA 
AAATTTGCTC 
TGCATTACAT 
ACAAAGACTC 
TCGCCTATAA 
TAGTTAAGGA 
CTGAACTGTT 
AAAGAGTTTT 
CTAGTGCTAT 
TCCCCTTTGC 
TACCCTTATC 
CAAATCGATT 
CACCAAGTCA 
AGCTTCAGCA 
GCTACGAAGA 
CTGTCCTCTT 
CCCAGGCCCT 
CATTCTGCCC 
TTGAACTTAT 
GACAGTTAAG 
AGGAAAAGGG 
TATAAGCAGG 
TTTTGGTCCC 
AAAGTAAAAC 
AAAATAGATC 
TGAGTATCTG 
GCTGTCTAAT 
TACAGCTACT 
TATAT 



TCAGTGTGAT 
TAGTAGTTCA 
CCCTCCCAAC 
TTTCATCTCT 
TGTTGCTGAG 
GAGTATTTTT 
TATGCTGAAA 
CATGGGAAAA 
ATT CATTAAT 
TACTGCAGTA 
TAAAGTTAGC 
TCACCGAACT 
GTGGGTAAAT 
TGCATGCTTT 
CTGTGTATAG 
CAGTATTTAA 
ATGAATACAA 
TAAG CTAGAT 
TAACTTATAG 
TTTCAGGTGT 
AATTAAATGC 
AAAACCTAAC 
TATTGAAAAG 
CAGCTCTAAG 
AAGTTTTCCC 
TTCCCATTTC 
ACAGAAATTA 
ATTTGTCTGT 
AATAGTCCTT 
AAGTACTAAA 
GAGGAAATAA 
ATAAAATCTC 
TTACATGACC 
CAAAGTCATA 
TGGTGCTTAA 
GAACTTTATT 
ACTCCAAATC 
CTATTTATTT 
ATTCATCCTG 
ATATTTCTTT 
TGCCAAAACC 
TGCCTCCCTT 
GTTTCCAAAA 
GGCGTAGGCT 
CCTGCTGTCG 
TCTTGGGTCT 
ATCCTGAACA 
TACGGTTAGT 
CTGATCGCTT 
AGCCAAAAGT 
AGAATCTTCC 
TATTAATAAA 
CACGTACAGA 
ACTATTAAAG 
ATAACTCATG 
GAAATATTGT 
GTAATCCTTT 
CATAATTTTT 



CACCCTGTTA 2400 

TACCCACTCA 2460 

ACCCTTAATT 252 0 

TTGTCTGGTT 2 580 

GCCATTATAT 2 640 

TAGTATTAGC 2700 

GTTTGCCTTG 2760 

GTTAATGTGA 2820 

GCATTCTGAG 2880 

TGGGG AGT AA 2940 

CATATAAATG 3000 

TCAAATTGAT 3060 

TAGATACTAT 3120 

AATCTGGTTA 3180 

TATTTCATGA 3240 

ATATTGCAAA 3300 

AAAGAAGAGC 3360 

TTTAGAATAA 342 0 

CAAACTACCA 348 0 

GGCTGTGGAA 3540 

TAAGAATGAT 3 600 

TTCCATCCTG 3 660 

TAATGTTGT C 372 0 

CAAATAATGA 3780 

TTGAAAATGT 3840 

ATGAATATAA 3900 

AGACTTTATC 3 960 

TCCAGTGATG 402 0 

CTTTAACTTA 4080 

AAGAATAATA 4140 

TGAAGATATA 4200 

TTATAAAACG 4260 

GTGTTTATTT 4320 

AAATAGCCTA 4380 

AGTGTGATTG 4440 

TTTTTAAAAA 4500 

CACTCCGTTT 4560 

AAGAAAGTAA 462 0 

TAAAACTCTT 4680 

AAAATTCTTT 4740 

AGAGCAAAAT 4800 

TGCCTCGTCT 4860 

TTGCCCCTCA 4920 

CACCCTGGGC 4 980 

AGTTGAGAAA 5040 

AAAGCTCATA 5100 

GGAGACTAAA 5160 

ACCAGGACTG 5220 

GAGACTCCTA 5280 

TTTTAAAATA 5340 

ATGTTGGTGT 5400 

AATAACACAC 5460 

CATTTTATTT 5520 

TGCTGTTTTA 5580 

ATATGTTTGT 5640 

AGCAATACTT 5700 

AAAAATTCTC 5760 

T AAAGTT TAT 5820 
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Seq ID NO: 315 Protein sequence: 
Protein Accession #: XP_087254 
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MQFRECSING 
NETELIKEHD 
AAARIGIVFI 
AESSILPKCI 
REEKLAAVFQ 
SLSCGHFHRT 
EKLFMEVCRN 
GIMGKEGRQA 
QFYCLFSQQT 
SIKTFLYWTI 
MALETHFWTW 
ILMWTCLFL 
LERVIGRCSP 



11 

t 

MKYQEINGRL 
LFFKAVSLCH 
GNSEETMEVK 
GGEIEKTRIH 
FIEKDLILLG 
MNILELINQK 
CSAVLCCRMA 
ARNSDYAIAR 
LYDSVYLTLY 
LGFSHAFIFF 
INHLVTWGSI 
D I I KKVFDRH 
THISRSWSAS 



21 
i 

VPEGPTPDSS 
TVQISNVQTD 
TLGKLERYKL 
VDEFALKGLR 
ATAVEDRLQD 
SDSECAEQLR 
PLQKAKVIRL 
FKFLSKLLFV 
NICFTSLPIL 
FGSYLLIGKD 
IFYFVFSLFY 
LHPTSTEKAQ 
DPFYTNDRSI 



31 
I 

EGNLSYLSSL 
CTGDGPWQSN 
LHILEFDSDR 
TLCIAYRKFT 
KVRET I EALR 
QLARRITEDH 
IKISPEKPIT 
HGHFYYIRIA 
IYSLLEQHVD 
TSLLGNGQMF 
GGILWPFLGS 
LTETNAGIKC 
LTLSTMDSST 



41 
I 

SHLNNLSHLT 
LAPSQLEYYA 
RRMSVIVQAP 
SKEYEEIDKR 
MAG I KVWVLT 
VIQHGLWDG 
LAVGDGANDV 
TLVQYFFYKN 
PHVLQNKPTL 
GNWTFGTLVF 
QNMYFVFIQL 
LDSMCCFPEG 
C 



51 
I 

TSSSFRTSPE 
SSPDEKALVE 
SGEKLLFAKG 
IFEARTALQQ 
GDKHETAVSV 
TSLSLALREH 
SMIQEAHVGI 
VCFITPQFLY 
YRDISKNRLL 
TVMVITVTVK 
LSSGSAWFAI 
EAACASVGRM 



Seq ID NO: 316 DNA sequence 
Nucleic Acid Accession #: NM_004473
Coding sequence: 661.. 1791 
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l l l l 

CTCGCCAGCG GTCCGCGGGG CTGGAGACCC ACGCCGTGGA GAGGACCAGC CTCAGGTCGC 



60 
120 
1B0 
240 
300 
360 
420 
480 
540 
600 
660 
720 
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CCCGCCTGGG CCCGCGCCCC GACCTCGCTG CCCCCGCCTC GCCTCTCTGC CCGTGGCGCT 120 

'TACCGCCACC TTGGCCTCGG GGG CAGGGCA TGGGCGGCCC CCGCCAGATC GCCCAGCGCC 180 

AGTACTAACT GCCCTCGCTC TGGCCTTCGA GCCCGAAGCC TCTTCTGCGC GCACAACCTA 240 

GGCAGTAATC CTAAACTAGC GGG C AC C ACA GACCAGCTGC AGCCACCCCA ACCCAGGGAT 300 

5 CACTTCCGGA CCCCTCGACC GCCCGGCACC AGCG CGCAAG GGACCCTTCA GCCGGAGACC 360 

AGAGTCCAGT CCCGGTCGCG AGGCCACCGC CGCTGCCCGC CTCGAGAAGC ACAACGCGGG 42 0 

CTGAGCCGTC GGCTAGCGGG TCACTCCCGA GCCTCTGTCT GCACCGCGCC AGCCCCAGAC 480 

CACGGACGCT GAGCCTCCAG CGCGCGCCAG CCTGGGCCGC TGGGCTCTCC GGGCCAGCCC 540 

GCGACGATCC CCTGAGCTCT CCGCAGAAGG GCCGAGCGTC CGTTCCGGGG ACGCCAGGCC 60 0 

10 CGCCCCCGCC CCCCGACAGC CGCGGGGATC CAGAGCCCGG GGGTGCGGGA CGCCCGCGCC 660 

ATGACTGCCG AGAGCGGGCC GCCGCCGCCG CAGCCGGAGG TGCTGGCTAC CGTGAAGGAA 720 

GAGCGCGGCG AGACGGCAGC AGGGGCCGGG GTCCCAGGGG AGGCCACGGG CCGCGGGGCG 780 

GGCGGGCGGC GCCGCAAGCG CCCCCTGCAG CGCGGGAAGC CGCCCTACAG CTACAT CGCG 840 

CTCATCGCCA TGGCCATCGC GCACGCGCCC GAGCGCCGCC TCACGCTGGG CGGCAT CT AC 900 

15 AAGTTCATCA CCGAGCGCTT CCCCTTCTAC CGCGACAACC CCAAAAAGTG GCAGAACAGC 960 

ATCCGCCACA ACCTCACACT CAACGACTGC TTCCTCAAGA TCCCGCGCGA GGCCGGCCGC 1020 

CCGGGTAAGG GCAACTACTG GGCGCTCGAC CCCAACGCGG AGGACATGTT CGAGAGCGGC 1080 

AGCTTCCTGC GCCGCCGCAA GCGCTTCAAG CGCTCGGACC TCTCCACCTA CCCGGCTTAC 1140 

ATGCACGACG CGGCGGCTGC CGCAGCCGCC GCTGCCGCAG CCGCCGCCGC CGCCGCCGCC 120 0 

20 GCCGCCATCT TCCCAGGCGC GGTGCCCGCC GCGCGCCCCC CCTACCCGGG CGCCGTCTAT 1260 

GCAGGCTACG CGCCGCCGTC GCTGGCCGCG CCGCCTCCAG TCTACTACCC CGCGGCGTCG 1320 

CCCGGCCCTT GCCGCGTCTT CGGCCTGGTT CCTGAGCGGC CGCTCAGCCC AGAGCTGGGG 13 80 

CCCGCACCGT CGGGGCCCGG CGGCTCTTGC GCCTTTGCCT CCGCCGGCGC CCCCGCTACC 1440 

ACCACCGGCT ACCAGCCCGC AGGCTGCACC GGGGCCCGGC CGGCCAACCC CTCTGCCTAT 1500 

25 GCGGCTGCCT ACGCGGGCCC CGACGGCGCG TACCCGCAGG GCGCCGGCAG TGCGATCTTT 1560 

GCCGCTGCTG GCCGCCTGGC GGGACCCGCT TCGCCCCCAG CGGGCGGCAG CAGTGGCGGC 162 0 

GTGGAGACCA CGGTGGACTT CTACGGGCGC ACGTCGCCCG GCCAGTTCGG AGCGCTGGGA 1680 

GCCTGCTACA ACCCTGGCGG GCAGCTCGGA GGGGCCAGTG CAGGCGCCTA CCATGCTCGC 1740 

• CATGCTGCCG CTTATCCCGG TGGGATAGAT CGGTTCGTGT CCGCCATGTG AGCCAGCGTA 18 00 

30 GGGACGAAAA CTCATAGACA CATCGGCTGT TCACACGTTC CCCGCAACCT GAGAACGAAC 18 60 

AGGAATGGAG AGAGGACTCA ACTGGGACCC ACGTGGAAAA GACCGAGCAG GCCACAGAGG 192 0 

CTCGGTCTCC CCGCGCACAG CGTAGGCACC CTGTGTACTC TGTAAACGGG AGGAGGTGGG 1980 

GCGAGGCAGC CAGAGCCCTT GGACTGGCAC AGGGACCCTC GATGGAGCGA AGCCCTCAAA 2 040 

CGGGATGCTT TCTGGCATTC TATCGGGGAG GGTCCTTGGC GGTAACCAGA GGGCAGCGTA 210 0 

35 GTGTCAACAC CAGAGACCAG GATCCAAATT GTGGGGAATC AGTTTCAGCC TTCCATGTGC 2160 

TGCCGGAACT CGGGCCTTTT TACGCGGTTC GTCCTCTAGT GCCTTTAACT GCGTTACTAC 222 0 

AATAAAAGGC TGCGGCAGCG CCTTTCTTCT TAAAGTGAGG AGGACAAATT TGCAAAAGAA 22 80 

ATAGGCTTTT CTTCTTTTTT AAATTGGAGA AATCT CTGCT CTGGTTGACC TGGGCTGGTT 2340 

TTCCCTGTCT CTGAGAACTT GAGACCTAGC TCCGAGTTGA ACTGTGCGTC AGCACTCCAG 240 0 

40 TCCCATCACC TGAACCTTCA GTCTCCCCCA TCTGTTACAC TAGAGGGCTG CAGGACTCTA 2460 

TCCACCGCCC CCGGGTTATC ATTCAGGGCC CCATCATCTT GGATGCTGCC CTGCGTATTT 252 0 

GGCAGCAATG GTGGGCCACC CAGGGCCTCT GAGTAGCCAC CCAAAGCCTA GCCGCTGTTC 25 80 

TAGGGAACGG AAAAGAGTTC ATGGCCAAGC GTCTAACCTA AAGTCCCAGG ATTGGCTCCA 2 640 

GGCAGCAATT ATATCATAAC TTATTGAACT TTTGAGCAGG ACGTGCTGGT AATTTCATGG 2 70 0 

45 CTGTTACTGC CCAGTCATAA ATCTGCTTTT CCATTATAAG GCAGAGAGAA GTACATTCGT 2760 

TCATTTGTCC ACTGTTTCTT GTCATCACGC AGCCCTGGAC CCAAAGGGTG AACTAAAGTT 282 0 

TAAGGAGATG AGAGGATTCA AGGAGCCCGT TGGTGACGCC TTTCAGTAGC TGGGGAGGGC 2 88 0 

TCTTCCATCC CCAGCACCCC CTGCTACACC TCAGCAGCCT CCCCCATGCA AAAAGGAAAG 2 940 

AGAAAAATTA AGTTAGGGCA GTCAGTAAAG TGAGCTTTAG AAAGAAACTG GAATTTTAAC 3 0 00 

50 TTCATTTTGT ATCTTGCTTA AGTAGCAGGC TCACTAAAAT TAGAGAAAGT CCAATAACTC 3 0 60 

TCCCCCTTTC CCTTGAGAAA TCTTTAAGTT TCGATTCTGG AGCAAAAACT TTCAGCATTA 312 0 

AATATTTCAG AGGCTCCATT CACAGCTTTC AGATAAACTG GAGTGTTCAG ATGGACTGTT 3180 

TTAATAAAAA TCTTTGAGCA AGTGAGTTAT GGCAAGAGAA ACTCAGCCTC TTTCTGTATA 3240 

AACTTAACAG GGAAGGGCTG GGGTGTGAAA AAGAAGATTG TATGAAAACC ATTGGTAATT 3300 

55 TTTATTTTTT ATTTTTGGGA CTGCACTATC CTGTTCACGA AGACATGTGA ACTTGGTTCA 33 60 

GTCCAAATGG GGATTTGTAT AAACCAGTGC TCTCCATTAG AAATATGGTG CAAGCCACAT 3420 

ATGTAATTTT AAATATTCTA GTAGCCACAT TAATAAAGTN AAAAGAAACA AAAAAAAAAA 3 4 80 
AA 

60 Seq ID NO: 317 Protein sequence: 
Protein Accession #: NP_004464
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1 11 21 31 41 51 

t-c \ I I I I I 

OD FKHLTHYROI DTRANSCRIP TIONF ACTOR TTFMTAESGP PPPQPEVLAT VKEERGETAA 60 

GAGVPGEATG RGAGGRRRKR PLQRGKPPYS YIALIAMAIA HAPERRLTLG GIYKFITERF 12 0 

PFYRDNPKKW QNSIRHNLTL NDCFLKIPRE AGRPGKGNYW ALDPNAEDMF ESGSFIjRRRK 180 

RFKRSDLSTY PAYMHDAAAA AAAAAAAAAA AAAAAIFPGA VPAARPPYPG AVYAGYAPPS 240 

LAAPPPVYYP AASPGPCRVF GLVPERPLSP ELGPAPSGPG GSCAFASAGA PATTTGYQPA 3 00 

70 GCTGARPANP SAYAAAYAGP DGAYPQGAGS AIFAAAGRLA GPASPPAGGS SGGVETTVDF 360 
YGRTSPGQFG ALGACYNPGG QLGGASAGAY HARHAAAYPG GIDRFVSAM 



75 



Seq ID NO: 318 DNA sequence 
Nucleic Acid Accession #: NM_005688 
Coding sequence: 126.. 4439 



1 11 21 31 41 51 

OA I I I I I I 

OU CCGGGCAGGT GGCTCATGCT CGGGAGCGTG GTTGAGCGGC TGGCGCGGTT GTCCTGGAGC 60 

AGGGGCGCAG GAATTCTGAT GTGAAACTAA CAGTCTGTGA GCCCTGGAAC CTCCGCTCAG 12 0 

AGAAGATGAA GGATAT CGAC ATAGGAAAAG AGTATATCAT CCCCAGTCCT GGGTATAGAA 180 

GTGTGAGGGA GAGAACCAGC ACTTCTGGGA CGCACAGAGA CCGTGAAGAT TCCAAGTTCA 240 

GGAGAACTCG ACCGTTGGAA TGCCAAGATG CCTTGGAAAC AGCAGCCCGA GCCGAGGGCC 3 00 

85 TCTCTCTTGA TGCCTCCATG CATTCTCAGC TCAGAATCCT GGATGAGGAG CATCCCAAGG 3 60 

GAAAGTACCA TCATGGCTTG AGTGCTCTGA AGCCCATCCG GACTACTTCC AAACACCAGC 420 

ACCCAGTGGA CAATGCTGGG CTTTTTTCCT GTATGACTTT TTCGTGGCTT TCTTCTCTGG 480 



304 
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CCCGTGTGGC CCACAAGAAG GGGGAGCTCT CAATGGAAGA CGTGTGGTCT CTGTCCAAGC 540 

ACGAGTCTTC TGACGTGAAC TGCAGAAGAC TAGAGAGACT GTGGCAAGAA GAGCTGAATG 60 0 

AAGTTGGGCC AGACGCTGCT TCCCTGCGAA GGGTTGTGTG GATCTTCTGC CGCACCAGGC 660 

TCATCCTGTC CATCGTGTGC CTGATGATCA CGCAGCTGGC TGGCTTCAGT GGACCAGCCT 720 

TCATGGTGAA ACACCTCTTG GAGTATACCC AGGCAACAGA GTCTAACCTG CAGTACAGCT 780 

TGTTGTTAGT GCTGGGCCTC CTCCTGACGG AAATCGTGCG GTCTTGGTCG CTTGCACTGA 840 

CTTGGGCATT GAATTACCGA ACCGGTGTCC GCTTGCGGGG GGCCATCCTA ACCATGGCAT 900 

TTAAGAAGAT CCTTAAGTTA AAGAACATTA AAGAGAAATC CCTGGGTGAG CTCATCAACA 960 

TTTGCTCCAA CGATGGGCAG AGAATGTTTG AGGCAGCAGC CGTTGGCAGC CTGCTGGCTG 1020 

GAGGACCCGT TGTTGCCATC TTAGGCATGA TTTATAATGT AATTATTCTG GGACCAACAG 1080 

GCTTCCTGGG ATCAGCTGTT TTTATCCTCT TTTACCCAGC AATGATGTTT GCATCACGGC 1140 

T C ACAG CAT A TTTCAGGAGA AAATGCGTGG CCGCCACGGA TGAACGTGTC CAGAAGATGA 1200 

ATGAAGTTCT TACTTACATT AAATTT AT CA AAATGTATGC CTGGGTCAAA GCATTTTCTC 1260 

AGAGTGTTCA AAAAATCCGC GAGGAGGAGC GTCGGATATT GGAAAAAGCC GGGTACTTCC 1320 

AGGGTATCAC TGTGGGTGTG GCTCCCATTG TGGTGGTGAT TGCCAGCGTG GTGACCTTCT 13 80 

CTGTTCATAT GACCCTGGGC TTCGATCTGA CAGCAGCACA GGCTTTCACA GTGGTGACAG 1440 

TCTTCAATTC CATGACTTTT GCTTTGAAAG TAACACCGTT TTCAGTAAAG TCCCTCTCAG 1500 

AAGCCTCAGT GGCTGTTGAC AGATTTAAGA GTTTGTTTCT AATGGAAGAG GTTCACATGA 1560 

TAAAGAACAA ACCAGCCAGT CCTCACATCA AGATAGAGAT GAAAAATGCC ACCTTGGCAT 162 0 

GGGACTCCTC CCACTCCAGT ATCCAGAACT CGCCCAAGCT GACCCCCAAA ATGAAAAAAG 1680 

ACAAGAGGGC TTCCAGGGGC AAGAAAGAGA AGGTGAGGCA GCTGCAGCGC ACTGAGCATC 1740 

AGGCGGTGCT GGCAGAGCAG AAAGGCCACC TCCTCCTGGA CAGTGACGAG CGGCCCAGTC 1800 

CCGAAGAGGA AGAAGGCAAG CACATCCACC TGGGCCACCT GCGCTTACAG AGGACACTGC 1860 

ACAGCAT CGA TCTGGAGATC CAAGAGGGTA AACTGGTTGG AATCTGCGGC AGTGTGGGAA 1920 

GTGGAAAAAC CTCTCTCATT TCAGCCATTT TAGGCCAGAT GACGCTTCTA GAGGGCAGCA 1980 

TTGCAATCAG TGGAACCTTC GCTTATGTGG CCCAGCAGGC CTGGATCCTC AATGCTACTC 2 040 

TGAGAGACAA CATCCTGTTT GGGAAGGAAT ATGATGAAGA AAGATACAAC TCTGTGCTGA 2100 

ACAGCTGCTG CCTGAGGCCT GACCTGGCCA TTCTTCCCAG CAGCGACCTG ACGGAGATTG 2160 

GAGAGCGAGG AGCCAACCTG AGCGGTGGGC AGCGCCAGAG GATCAGCCTT GCCCGGGCCT 222 0 

TGTATAGTGA CAGGAGCATC TACATCCTGG ACGACCCCCT CAGTGCCTTA GATGCCCATG 2280 

TGGGCAACCA CATCTTCAAT AGTGCTATCC GGAAACATCT CAAGT CCAAG ACAGTTCTGT 2340 

TTGTTACCCA CCAGTTACAG TACCTGGTTG ACTGTGATGA AGTGATCTTC ATGAAAGAGG 240 0 

GCTGTATTAC GGAAAGAGGC ACCCATGAGG AACTGATGAA TTTAAATGGT GACTATGCTA 24 60 

CCATTTTTAA TAACCTGTTG CTGGGAGAGA CACCGCCAGT TGAGATCAAT TCAAAAAAGG 252 0 

AAACCAGTGG TTCACAGAAG AAGT CACAAG ACAAGGGTCC TAAAACAGGA T CAGTAAAG A 2580 

AGGAAAAAGC AGTAAAGCCA GAGGAAGGGC AGCTTGTGCA GCTGGAAGAG AAAGGGCAGG 2 640 

GTTCAGTGCC CTGGTCAGTA TATGGTGTCT ACAT CCAGGC TGCTGGGGGC CCCTTGGCAT 2 700 

TCCTGGTTAT TATGGCCCTT TTCATGCTGA ATGTAGGCAG CACCGCCTTC AG CACCTGG T 2760 

GGTTGAGTTA CTGGATCAAG CAAGGAAGCG GGAACACCAC TGTGACTCGA GGGAACGAGA 2820 

CCTGGGTGAG TGACAGCATG AAGG ACAAT C CT CATATGC A GTACTATGCC AGCATCTACG 2880 

CCCTCTCCAT GGCAGTCATG CTGATCCTGA AAGCCATTCG AGGAGTTGTC TTTGTCAAGG 2 940 

GCACGCTGCG AGCTTCCTCC CGGCTGCATG ACGAGCTTTT CCGAAGGATC CTTCGAAGCC 3000 

CTATGAAGTT TTTTGACACG ACCCCCACAG GGAGGATTCT CAACAGGTTT TCCAAAGACA 30 60 

TGGATGAAGT TGACGTGCGG CTGCCGTTCC AGGCCGAGAT GTTCATCCAG AACGTTATCC 312 0 

TGGTGTTCTT CTGTGTGGGA ATGATCGCAG GAGTCTTCCC GTGGTTCCTT GTGGCAGTGG 3180 

GGCCCCTTGT CATCCTCTTT TCAGTCCTGC ACATTGTCTC CAGGGTCCTG ATTCGGGAGC 3240 

TGAAGCGTCT GGACAATATC ACGCAGTCAC CTTTCCTCTC CCACATCACG TCCAGCATAC 33 0 0 

AGGGCCTTGC CACCATCCAC GCCTACAATA AAGGGCAGGA GTTTCTGCAC AGATACCAGG 33 60 

AGCTGCTGGA TGACAACCAA GCTCCTTTTT TTTTGTTTAC GTGTGCGATG CGGTGGCTGG 342 0 

CTGTGCGGCT GGACCTCATC AGCATCGCCC TCATCACCAC CACGGGGCTG ATGATCGTTC 3480 

TTATGCACGG GCAGATTCCC CCAGCCTATG CGGGTCTCGC CATCTCTTAT GCTGTCCAGT 3540 

TAACGGGGCT GTTCCAGTTT ACGGT CAGAC TGGCATCTGA GACAGAAGCT CGATTCACCT 3 600 

CGGTGGAGAG GATCAATCAC TACATTAAGA CTCTGTCCTT GGAAGCACCT GCCAGAATTA 3 660 

AGAACAAGGC TCCCTCCCCT GACTGGCCCC AGGAGGGAGA GGTGACCTTT GAGAACGCAG 3 720 

AGATGAGGTA CCGAGAAAAC CTCCCTCTTG TCCTAAAGAA AGTATCCTTC ACGATCAAAC 3780 

CTAAAGAGAA GATTGGCATT GTGGGGCGGA CAGGATCAGG GAAGTCCTCG CTGGGGATGG 3840 

CCCTCTTCCG TCTGGTGGAG TTATCTGGAG GCTGCATCAA GATTGATGGA GTGAGAATCA 3 900 

GTGATATTGG CCTTGCCGAC CTCCGAAGCA AACTCTCTAT CATTCCTCAA GAGCCGGTGC 3 960 

TGTTCAGTGG CACTGTCAGA TCAAATTTGG ACCCCTTCAA CCAGTACACT GAAGACCAGA 402 0 

TTTGGGATGC CCTG GAGAGG ACACACATGA AAGAATGTAT TGCTCAGCTA CCTCTGAAAC 40 80 

TTGAATCTGA AGTGATGGAG AATGGGGATA ACTTCTCAGT GGGGGAACGG CAGCTCTTGT 4140 

GCATAGCTAG AGCCCTGCTC CGCCACTGTA AGATTCTGAT TTTAGATGAA GCCACAGCTG 4200 

CCATGGACAC AGAGACAGAC TTATTGATTC AAGAGACCAT CCGAGAAGCA TTTGCAGACT 42 60 

GTACCATGCT GACCATTGCC CATCGCCTGC ACACGGTTCT AGGCTCCGAT AGGATTATGG 432 0 

TGCTGGCCCA GGGACAGGTG GTGGAGTTTG ACACCCCATC GGTCCTTCTG TCCAACGACA 43 80 

GTTCCCGATT CTATGCCATG TTTGCTGCTG CAGAGAACAA GGTCGCTGTC AAGGGCTGAC 4440 

TCCTCCCTGT TGACGAAGTC TCTTTTCTTT AGAGCATTGC CATTCCCTGC CTGGGGCGGG 4500 

CCCCTCATCG CGTCCTCCTA CCGAAACCTT GCCTTTCTCG ATTTTATCTT TCGCACAGCA 4560 

GTTCCGGATT GGCTTGTGTG TTTCACTTTT AGGGAGAGTC ATATTTTGAT TATTGTATTT 4620 

ATTCCATATT CATGTAAACA AAATTTAGTT TTTGTTCTTA ATTGCACTCT AAAAGGTTCA 4680 

GGGAACCGTT ATTATAATTG TATCAGAGGC CTATAATGAA GCTTTATACG TGTAGCTATA 4740 

TCTATATATA ATTCTGTACA TAGCCTATAT TTACAGTGAA AATGTAAGCT GTTTATTTTA 4800 

TATTAAAATA AGCACTGTGC TAATAACAGT GCATATTCCT TTCTATCATT TTTGTACAGT 4860 

TTGCTGTACT AGAGATCTGG TTTTGCTATT AGACTGTAGG AAGAGTAGCA TTTCATTCTT 4920 

CTCTAGCTGG TGGTTTCACG GTGCCAGGTT TTCTGGGTGT CCAAAGGAAG ACGTGTGGCA 4980 

ATAGTGGGCC CTCCGACAGC CCCCTCTGCC GCCTCCCCAC AGCCGCTCCA GGGGTGGCTG 5040 

GAGACGGGTG GGCGGCTGGA GACCATGCAG AGCGCCGTGA GTTCTCAGGG CTCCTGCCTT 5100 

CTGTCCTGGT GTCACTTACT GTTTCTGTCA GGAGAGCAGC GGGGCGAAGC CCAGGCCCCT 5160 

TTTCACTCCC TCCATCAAGA ATGGGGATCA CAGAGACATT CCTCCGAGCC GGGGAGTTTC 5220 

TTTCCTGCCT TCTTCTTTTT GCTGTTGTTT CTAAACAAGA ATCAGTCTAT CCACAGAGAG 5280 

TCCCACTGCC TCAGGTTCCT ATGGCTGGCC ACTGCACAGA GCTCTCCAGC TCCAAGACCT 5340 

GTTGGTTCCA AGCCCTGGAG CCAACTGCTG CTTTTTGAGG TGGCACTTTT TCATTTGCCT 5400 

ATTCCCACAC CTCCACAGTT CAGTGGCAGG GCTCAGGATT TCGTGGGTCT GTTTTCCTTT 5460 

CTCACCGCAG TCGTCGCACA GTCTCTCTCT CTCTCTCCCC TCAAAGTCTG CAACTTTAAG 5520 

CAGCTCTTGC TAATCAGTGT CTCACACTGG CGTAGAAGTT TTTGTACTGT AAAGAGACCT 5580 

ACCTCAGGTT GCTGGTTGCT GTGTGGTTTG GTGTGTTCCC GCAAACCCCC TTTGTGCTGT 5640 

GGGGCTGGTA GCTCAGGTGG GCGTGGT CAC TGCTGTCATC AGTTGAATGG TCAGCGTTGC 5700 



305 



WO 02/086443 

ATGTCGTGAC CAACTAGACA TTCTGTCGCC 
CAAAAATCTG AAAATGTGAA TAAAATTATT 
AAAAAAAAAA AAAAAAAA 



TTAGCATGTT TGCTGAACAC CTTGTGGAAG 
TTGGATTTTG TAAAAAAAAA AAAAAAAAAA 



Seq ID NO: 319 Protein sequence: 
Protein Accession #: NP_005679 

1 11 21 

I I I 

MKDIDIGKEY IIPSPGYRSV RERTSTSGTH 
LDASMHSQLR I LDEEHPKGK YHHGLSALKP 
VAHKKGELSM EDVWSLSKHE SSDVNCRRLE 
LSIVCLMITQ LAGFSGPAFM VKHLLEYTQA 
ALNYRTGVRL RGAI LTMAFK KILKLKNIKE 
PWAILGMIY NVIILGPTGF LGSAVFILFY 
VLTYIKFIKM YAWVKAFSQS VQKIREEERR 
HMTLGFDLTA AQAFTWTVF NSMTFALKVT 
NKPASPHIKI EMKNATLAWD SSHSSIQNSP 
VLAEQKGHLL LDSDERPSPE EEEGKHIHLG 
KTSLISAILG QMTLLEGSIA ISGTFAYVAQ 
CCLRPDLAIL PSSDLTEIGE RGANLSGGQR 
NHIFNSAIRK HLKSKTVLFV THQLQYLVDC 
FNNLLLGETP PVEINSKKET SGSQKKSQDK 
VPWSVYGVYI QAAGGPLAFL VIMALFMLNV 
VSDSMKDNPH MQYYASIYAL SMAVMLILKA 
KFFDTTPTGR I LNRFSKDMD EVDVRLPFQA 
LVILFSVLHI VSRVLIRELK RLDNITQSPF 
LDDNQAPFFL FTCAMRWLAV RLDLISIALI 
GLFQFTVRLA SETEARFTSV ERINHYIKTL 
RYRENLPLVL KKVSFTIKPK EKIGIVGRTG 
IGLADLRSKL SIIPQEPVLF SGTVRSNLDP 
SEVMENGDNF SVGERQLLCI ARALLRHCKI 
MLTIAHRLHT VLGSDRIMVL AQGQWEFDT 



31 41 51 

1 I I 

RDREDSKFRR TRPLECQDAXj ETAARAEGLS 

IRTTSKHQHP VDNAGLFSCM TFSWLSSLAR 

RLWQEELNEV GPDAASLRRV VWIFCRTRLI 

TESNLQYSLL LVLGLLLTEI VRSWSLALTW 

KSLGELINIC SNDGQRMFEA AAVGSLLAGG 

PAMMFASRLT AYFRRKCVAA TDERVQKMNE 

I LEKAGYFQG ITVGVAPIW VIASWTFSV 

PFSVKSLSEA SVAVDRFKSL FLMEEVHMIK 

KLTPKMKKDK RASRGKKEKV RQLQRTEHQA 

HLRLQRTLHS IDLEIQEGKL VGICGSVGSG 

QAW I LNATLR DNILFGKEYD EERYNSVLNS 

QRISLARALY SDRSIYILDD PLSALDAHVG 

DEVIFMKEGC ITERGTHEEL MNIiNGD YAT I 

GPKTGSVKKE KAVKPEEGQL VQLEEKGQGS 

GSTAFSTWWL SYWIKQGSGN TTVTRGNETS 

IRGWFVKGT LRASSRLHDE LFRRILRSPM 

EMFIQNVILV FFCVGMIAGV FPWFLVAVGP 

LSHITSSIQG L AT I HAYNKG QEFLHRYQEL 

TTTGLMIVLM HGQIPPAYAG LAISYAVQLT 

SLEAPARIKN KAPSPDWPQE GEVTFENAEM 

SGKSSLGMAL FRLVELSGGC IKIDGVRISD 

FNQYTEDQIW DALERTHMKE CIAQLPLKLE 

LILDEATAAM DTETDLLIQE TIREAFADCT 

PSVLLSNDSS RFYAMFAAAE NKVAVKG 



Seq ID NO: 320 DNA sequence

Nucleic Acid Accession #: AK022089.1 

Coding sequence: 181-1488 

1 11 21 31 41 51 

1 I I 1 I 1 

AGCAGTTGCA CAACTTCCAG CAACTTTCTC AGCCGGCTAC TAATGAGCTG AAAGCCAGGA 

ACATCCGAGG AGAAGAGAAA GCTTCCAGCC CTCCTCCCTT CACCCTGGAA ATCCAGACAC 

CCCCACCCCC ACCCTCAGAT CACTTTAAGA TAATTTCTTT ATTCGTTTGC CCGACAGACC 

ATGGCTCCCT TTGGAAGAAA CTTGCTAAAG ACTCGGCATA AAAACAGATC TCCAACTAAA 

GACATGGATT CAGAAGAGAA GGAAATTGTG GTTTGGGTTT GCCAAGAAGA GAAGCTTGTC 

TGTGGGCTGA CTAAACGCAC CACCTCTGCT GATGTCATCC AGGCTTTGCT TGAGGAACAT 

GAGGCTACGT TTGGAGAGAA ACGATTTCTT CTGGGGAAGC CCAGTGATTA CTGCAT CAT A 

GAGAAGTGGA GAGGCTCCGA AAGGGTTCTT CCTCCACTAA CTAGAATCCT GAAGCTTTGG 

AAAGCGTGGG GAGATGAGCA GCCCAATATG CAATTTGTTT TGGTTAAAGC AGATGCTTTT 

CTTCCAGTTC CTTTGTGGCG GACAGCTGAA GCCAAATTAG TGCAAAACAC AGAAAAATTG 

TGGGAGCTCA GCCCAGCAAA CTACATGAAG ACTTTACCAC CAGATAAACA AAAAAGAATA 

GTCAGGAAAA CTTTCCGGAA ACTGGCTAAA ATTAAGCAGG ACACAGTTTC TCATGAT CG A 

GATAATATGG AGACATTAGT TCATCTGATC ATTTCCCAGG ACCATACTAT TCATCAGCAA 

GTCAAGAGAA TGAAAGAGCT GGATCTGGAA ATTGAAAAGT GTGAAGCTAA GTTCCATCTT 

GATCGAGTAG AAAATGATGG AGAAAACTAT GTT CAGGATG CATATTTAAT GCCCAGTTTC 

AGTGAAGTTG AGCAAAATCT AGACTTGCAG TATGAGGAAA ACCAGACTCT GGAGGACCTG 

AG CGAAAGTG ATGGAATTGA ACAGCTGGAA GAACGACTGA AATATTACCG AATACTCATT 

GATAAGCTCT CTGCTGAAAT AGAAAAAGAG GTAAAAAGTG TTTGCATTGA TATAAATGAA 

GATGCGGAAG GGGAAGCTGC AAGTGAACTG GAAAGCTCTA ATTTAGAGAG TGTTAAGTGT 

GAT TTG GAGA AAAGCATGAA AGCTGGTTTG AAAATTCACT CTCATTTGAG TGGCATCCAG 

AAAGAGATTA AATACAGTGA CTCATTGCTT CAGATGAAAG CAAAAGAATA TGAACTCCTG 

GCCAAGGAAT TCAATTCACT TCACATTAGC AACAAAGATG GGTGCCAGTT AAAGGAAAAC 

AGAGCGAAGG AATCTGAGGT TCCCAGTAGC AATGGGGAGA TTCCTCCCTT TACTCAAAGA 

GTATTTAGCA ATTACACAAA TGACACAGAC TCGGACACTG GTATCAGTTC TAACCACAGT 

CAGGACTCCG AAACAACAGT AGGAGATGTG GTGCTGTTGT CAACATAGTT CCAATGGCTC 

CTTTCTGACC TGCTTT CATG TTTTAATGTT TGTTTAATTT AATAGGAAAC CTCATTTTAA 

ATATAACACT CAAAAAAATG TAAATCATAT TGTAGT ATT C AATAGTTAAT AAAAACTCGA 

GAAATGTGTT GTTTCTG 

Seq ID NO: 321 Protein sequence:
Protein Accession #: NP_005438.1 

1 11 21 31 41 51 

I I I I I I 

MAP FGRNLLK TRHKNRSPTK DMDSEEKEIV VWVCQEEKLV CGLTKRTTSA DVIQALLEEH 

EATFGEKRFL LGKPSDYCII EKWRGSERVL PPLTRILKLW KAWGDEQPNM QFVLVKADAF 

LPVPLWRTAE AKLVQNTEKL WELSPANYMK TLPPDKQKRI VRKTFRKIiAK IKQDTVSHDR 

DNMETLVHIi I ISQDHTIHQQ VKRMKELDLE I EKCEAKFHL DRVENDGENY VQDAYLMPSF 

SEVEQNIiDLQ YEENQTLEDL SESDGIEQLE ERLKYYRILI DKLSAEIEKE VKSVCIDINE 

DAEGEAASEL ESSNLESVKC DLEKSMKAGL KIHSHLSGIQ KEIKYSDSLL QMKAKEYELL 

AKEFNSLHIS NKDGCQLKEN RAKES EVP SS NGEIPPFTQR VFSNYTNDTD SDTGISSNHS 

QDSETTVGDV VLLST 

Seq ID NO: 322 DNA sequence 

Nucleic Acid Accession #: NM_030920.1 



306 



WO 02/086443 

Coding sequence: 317-1123 
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21 



I 



1 



AGCATTGAAG 
GGCGCGTGCG 
AGTTAGAGTC 
CTGGTGGTGG 
AAAATTTTGG 
AGAGCAAGAG 
CCCGGAGGAG 
AGGCCTGAAT 
TTCGCTGGCC 
AATTTCTGGA 
GAGTGGAAAC 
GAAAAGTCTT 
TTTTGAACTA 
GCCGGACTCT 
AAATGAAGCT 
TGAGGATGAG 
AGTGGGCCTC 
TGTTGAAGAA 
GAAACGAGAT 
TTCTCTAATG 
AGCTATCCCT 
TTGCCTTATC 
ATTTTCATTG 
TTCAAGCTTA 
GGTGTAGTAT 
AATATAAAAT 
GGAATCTTTA 
TTTGGTTGCT 
TTCAGCAACA 
TAGTGGTGAC 
CATGCAGGTG 
GTTTTTAGGT 
GTTTCACTCC 
CTTTAGTCTT 
AAGAAATTGA 
TCTCCTTACC 
AAAGAAAAGC 
GCCTGTTGAT 
TTGGATACCA 
TAATAGCATT 
TTAAAATTAA 
AGTGAGTGTG 
CTCCTCTTTT 
TAAAATTTTT 
TTAATTGAAG 
TACTGCTTCT 
CTTGTGGAGA 
TAGTGAGGGG 
ATTCCCTGTT 
ATTTTTAAAA 
ATTAGAGTAC 
TTAGCTTTGT 
AGTTTTCGGT 
CTCAAGAATC 
AG CCATG ACA 



GGGAAGGAAC 
TGCGTGTGTG 
CCAACTCTTG 
TAGTGGGCGT 
GTTGGGGGTA 
GAGGACATGG 
GTGACAGAGT 
GATACTTTCA 
CGGCTTCCCA 
GGCTTGGAAG 
AAAATAAAAG 
GACCTGTTTA 
CTGCAGCAAA 
GAAGAGGAGG 
GGTCCACCGG 
GATGAAGATG 
TCATACTTAA 
GGGGAAGAAG 
GCTGAAGACG 
TTTCTGGGTG 
ACAGAAGATA 
ATTCCAAATA 
ACTCCCATTG 
CTGTATTAGT 
GGTGCATTTC 
GACAATAGTC 
GTTTGAAGGC 
TTTTTGTCAC 
TAGTTCATGG 
TGATAAGATT 
AGCCCTTTTG 
GTGCATTCTT 
CTCCCGCTCT 
ATACCTCAAC 
GTATTTTCTG 
ATAAATGTTT 
AGGGGTGCTT 
ATATTAATAA 
CTCTGCAAAG 
TAATTGGAAT 
GATTTGTTTT 
TGTTTCCTTA 
GCTATGGAGG 
TCCCTTTGTT 
TTATGCTTCT 
ACAATGTAAA 
AACTAAAAAT 
ATTGGAATCC 
CTAGTTCCTA 
TGAAATCTAT 
TTTGGTTTGA 
GGGTGGTATT 
CCTATTTTAA 
TCCTTAAAAA 
GTGTTAAAAA 



TGCGGGTGTG 
TGCGCGCGCT 
GACTCCATTT 
TTATATTTGC 
TTGGGGAAGG 
AGATGAAGAA 
TAGTCCTTGA 
AAGAACTAGA 
GCTTAAATAA 
TCCTGGCAGA 
ATCTCAGTAC 
ACTGTGAGAT 
TCACATACTT 
ATGATGAGGA 
AAGGATATGA 
AAGATGAAGC 
TGAAAGAAGA 
AGGAAGAAGA 
ATGGAGAGGA 
TGCAATAGAG 
ATGTGTAACT 
AGAACTAGTC 
TGGAATTCCC 
CATTTTTAGC 
ATTCCTTATT 
TCTTGAGTGG 
AGTTACCTTT 
AAGTAACTTG 
ATTTTGTGGA 
TTATTTTTGA 
TCAGGCTGCA 
TTTCTTCTTA 
CTCAAAAGGA 
TACGTTTCAG 
ACATAAGAAT 
CTTGGTTGAC 
TTGGAAGCAG 
GACATTAAAG 
TATTTCTAAC 
ATACTAGGCA 
CAAGTGGATG 
CATGGCTACT 
CTCCATGTTC 
TTGAATATTT 
ATACTGGGAC 
ATGTATGACT 
GTTGTACAAC 
CCAAAAAGAT 
ACAATTCTCA 
ATATTGACTT 
AAACAACACT 
TTCATGCAAA 
TGCTCTTTGT 
CTTTGAAGTT 
CAAAC 



31 
I 

GTGTGTGTAT 

AGTGTGTGGA 

GCTATTCTCT 

GTTCCTTTTC 

CAGGAAAGGG 

GAAGATTAAC 

TAATTGCCTG 
ATTTCTGAGT 

ACTTCGAAAA 
GAAATGT CC A 
AGTAGAAGCT 
CACAAACCTG 
AGATGGATTT 
TGGAGATGAA 
GGAAGAGGAG 
AGGTT CAGAG 
AATT CAGGAT 
GGAAGAAGGA 
AGAAGATGAC 
TGATCACATC 
TTTTATAGGA 
TGTTAATGAT 
TAGCAATTTA 
CCATAATTAA 
TATAGATTAA 
TAAGTTGGTT 
TTTTTTTTTT 
GAAAATAGAA 
GGTTCTATTC 
AGGAAAAATT 
AATCATGACA 
GCAATTCCTT 
ACTTGGGAAA 
TCCTGTCTGG 
ATATTATCAA 
AACAT CTAAG 
TGTTAGTGTT 
TCAAATTTTA 
CTTTAATTCC 
GCTGGAAAAG 
TCCATTAAAA 
AAATAAAATA 
AAGGCAATGG 
GTAAGTTTTT 
ATATTTAAAT 
TGGTGTTTTA 
TGACCGAAAG 
AACATTTTTC 
TTACATACTA 
TCTTATCAAT 
TAGAGCCTCC 
TAAGTAAGGG 
ATGGCAGTAT 
AATACTTTTG 



41 
i 

GTGTGTGTGT 
CAAGGAGGTG 
TCTTTCTCCC 
ATTCATTTCT 
AAAAGGAGAG 
CTGGAGTTAA 
TGTGTCAATG 
ATGGCTAATG 
TTGGAGCTTA 
AATCTTACCT 
CTGCAAAAT C 
GAAGATTATA 
GATCAGGAGG 
GATGATGAAG 
GAGGAAGAGG 
TTGGGAGAGG 
GAAGAAGATG 
GGTCTTCGAG 
TAGATCATTC 
TTTGTTTCTT 
AAAGTGTGGT 
CATATTGTAT 
TTTAGACTTA 
AACATGATCA 
CTGAAATTAC 
ATTTTTTTAG 
TTTTTTTTTG 
GCAGAATAGT 
AGTAATATGG 
GCTTATACTA 
TGCCGATGGT 
TATGATCACC 
CTTGTGAAAC 
GTTTTAAATA 
TACAGTTTTA 
ACAATATTAG 
CCTCAAAAGT 
ATGTTGGCCT 
CAGTTTTAAA 
TATTTGAAAC 
GTAGAAAAAT 
TAATGAGTAT 
CTTTTTAAAT 
AAGAAGTTAG 
ACTGAGTATA 
AAGTAAAAAT 
AAAACCCTTG 
TTCTGCTTTT 
TGCCAGATTA 
CATCTTACTG 
AGATAACTTT 
TGGGTTTTAT 
GTATATATTG 
TGCAACTGTG 



51 
I 

ATGTGTGTGC 
GGGGCAGCTG 
CCACACCTAT 
AAATCTCTTA 
TAGTAGCTGA 
GGAACAGATC 
GGGAAATTGA 
TGGAACTAAG 
GTGATAATAT 
ACCTCAATCT 
TTAAAAATTT 
GAGAAAGTAT 
ATAATGAAGC 
AGGAAGAGGA 
AAGAGGAGGA 
GAGAAGAGGA 
ATGATGACTA 
GGGAGAAGAG 
TAAGACCAGA 
CATGTACGAT 
TTTACTATTT 
GTAGAGAAAA 
ATTTTTTAAA 
CTTTTAAACA 
AGTTTGCTAT 
AGGTGATCCA 
ACTAAGAGTG 
AAAGGTTCTA 
TTCATGGATT 
AGTCCAGAGA 
TGTTTATTTT 
TTCCCTTCTT 
CCAGGAAAAC 
AGTGAAGTAG 
TGCAGTAAGC 
TGGGATGAAG 
CGGAACAAT T 
CTCAAATGAT 
ACAGATATAA 
TAAATTGACA 
ATTTGGGATA 
ACAAGTATAT 
CTTGGCTATC 
TGTCAGCAAA 
GTACTGCTGC 
TATGATGTTA 
GGGATAAGTT 
AAAAACTGAA 
CAAAAT ACT T 
TGCAATCAAA 
TAAGACTTAT 
ATTTTGTAGA 
TGTTAAGTTC 
TTTTGAATAA 



Seq ID NO: 323 Protein sequence: 
Protein Accession #: NP_112182.1



MEMKKKINLE 
PSLNKLRKLE 
FNCEITNLED 
PEGYEEEEEE 
EEEEEEEGGL 



11 
1 

LRNRSPEEVT 
LSDNIISGGL 
YRESIFELLQ 
EEEEDEDEDE 
RGEKRKRDAE 



31 



41 



51 



21 
I 

ELVLDNCLCV NGEIEGLNDT FKELEFLSMA NVELSSLARL 
EVLAEKCPNL TYLNLSGNKI KDLSTVEALQ NLKNLKSLDL 
QITYLDGFDQ EDNEAPDSEE EDDEDGDEDD EEEEENEAGP 
DEDEAGSELG EGEEEVGLSY LMKEEIQDEE DDDDYVEEGE 
DDGEEEDD 



Seq ID NO: 324 DNA sequence 
Nucleic Acid Accession #: NM_003812 
Coding sequence: 224..2722



85 



TCCTCTGCGT 
GCCCAGCCCC 
CCATGCGCGC 
GCTCTCGCCG 
CAGCTCGCGG 
ACGCGGCCCC 
GCTTCTCGTC 
GGCTGCTGCG 
GGCAGATGAA 
AATGCAGAAA 



11 
I 

CCCGCCCCGG 
GAGCCCCGCG 
CGAGCCGGCG 
GCCACACGGA 
CAGCCGCCCC 
GCCGGCTCGG 
CTTCTCCTGC 
CCCAGCGCTC 
GACAATACAT 
GAAATCACAC 



21 
I 

GAGTGGCTGC 
CCCCGTGCCC 
TGACCGGCTC 
GCGGCGCCCG 
TGGCGGGCTG 
TGCCTGCCAG 
TGCCTCCGCT 
CGCATTGGAA 
TGCAACAGAA 
TGCCTTCAAG 



31 

1 

GAGGCTAGGC 
CGAGCCCGGA 
CGCCCGCGGC 
GGAGCTATGA 
CAGCCTTGCC 
CGCCCCGGCC 
CGCCGCCTCG 
TGAAACTGCA 
TAGCAGCAGT 
ACTCATATAT 



41 
I 

GAGCCGGGAA 
GCCCCCTGCC 
CGCCCCGCAG 
GCCATGAAGC 
GGCGCTTCCT 
CGCACGCCGC 
TCCCGGCCCC 
GAAAAAAATT 
AATATCAGTT 
TACATCAACC 



51 
I 

AGGGGGCGCC 
CGCGGCGGCA 
CTAGCCCGGC 
CGCCCGGCAG 
GCGGCCCCCA 
CCTGCCGCCT 
GCGCCTGGGG 
TGGGAGTCCT 
ACAGCAATGC 
AAGACT CGG A 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3 060 
3120 
3180 
3240 



60 
120 
180 
240 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 



307 



10 



15 



20 



25 



30 
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40 



WO 02/086443 

AAGCCCTTAT CACGTTCTTG 
CCATCTGGCC CAGG CAAGCT 
CATACTGAAC AATGGTTTGT 
ACCACAGTAC TCTAAGGGTG 
AGACTCCAAG GTGGCTCTGT 
CTTCGTGTAT ATGATAGAGC 
ACATATAATC CAGAAAACCT 
GGAAAGAGGT GACCAGTGGC 
AGCAGTGAAT CCATCACGTG 
TAATGATCAC AAAACGTATA 
AAAGT CCGTG GTCAACCTTG 
CCTGGTGGCT GTAGAGACCT 
GCAGATGCTC CATGAGTTCT 
GCACCTCATC TCGCGGGTGA 
TGTCTGTTCT CGCACAAGAG 
ACAAGTATTA TCGCAGAGCC 
AAAGCCAAAA TGTGACTGCA 
GTCCCATTCT CGAAAATTTT 
AGGAGGTGGA GCCTGCCTTT 
AAATGGATAC GTGGAAGCTG 
ATTATGCTGT AAGAAATGTT 
TAACAATACC TCATGTCTTT 
GTGTGATATT ACTGAATATT 
GCAAGACGGA TATGCATGCA 
CAGAGACAAC CAGTGTCAGT 
CTATGAAAAG CTGAATACAG 
GTGGATTCAG TGCAGCAAAC 
TCGAGCTCCA CGTATTGGTC 
AGGCCGGGTG ATTGACTGCA 
CTATGTAGAA GATGGAACGC 
ACAAATTCAA GCCCTAAATA 
GGGCCATGGG GTGTGTAGTA 
AGATTGCAGT ATCCGGGATC 
GGGTCCTAGT GCCACCAATC 
TATTGTCCTT GGGGGCACAG 
TACTCAGCAA GGCCCCATCT 
ATTCTGGGTA TGACATACTC 
CTTTGGGTGG TAATGACTAC 
CTGTCTCTTT TGGAAATAAT 
GGGGGCAAAA GACCATGCTA 
ACGAAGGAAC AACACACACA 



ACACAAAGGC 
TCCAGAT TGA 
TGTCTTCTGA 
GAGAGCACTG 
CAACCTGCAA 
CACTAGAGCT 
TGGCAGGACA 
CCTTTCTCTC 
GTATATTTGA 
AGAAGCATCG 
TGGATTCTAT 
GGACTGAGAA 
CAAAATACCG 
CATTTCACTA 
GAGTTGGTGT 
TGGCTCAAAA 
CAGAATCCTG 
CAAAGTGCAG 
TCAACAGGCC 
GGGAGGAGTG 
CCCTCTCCAA 
TTCAGCCACG 
GTACTGGAGA 
ATCAAAATCA 
ACAT CTGGGG 
AAGGCACTGA 
ATGATGTGTT 
AACTT CAGGG 
GTGGTGCCCA 
CATGTGGCCC 
TGAGCAGCTG 
ATGAAGCCAC 
CAGTTAGGAA 
TCATAATAGG 
GCTGGGGATT 
GAATCAGCTG 
GCAGCAGTGT 
GGAGCTAAAG 
GTCAAAGAAC 
TAAAAAGAAC 
CAAAAATTAA 



AAGACACCAG 
AGCCTTCGGC 
TTATGTGGAG 
TTACTACCAT 
TGGACTT CAT 
GGTTCATGAT 
GTATTCTAAG 
TGAATTACAG 
AGAAATGAAA 
CTCTTCTCAT 
TTACAAGGAG 
GGATCAGATT 
GCAGCGCATT 
TAAGAGAAGC 
GAATGAGTAT 
CCTTGGAATC 
GGGTGGCTGC 
CATTTTGGAG 
AACAAAGCTA 
TGATTGTGGT 
CGGGGCTCAC 
AGGGTATGAA 
CTCTGGTCAG 
GGGCCGCTGC 
AACAAAGGCT 
GAAGGGAAAC 
CTGTGGATTC 
TGAGATCATT 
TGTAGTTTTA 
GTCTATGATG 
TCCACTCGAT 
CTGCATTTGT 
CCTTCACCCC 
CTCCATCGCT 
TAAAAATGTC 
CGCTGGATGG 
TACTGGAACT 
TTGGGGTGAC 
ACCTTTCACC 
TGTTCCAGAA 
ATGCAATAAA 



CAAAAACATA 
TCCAAATTCA 
ATTCACTACG 
GGAAGCATCA 
GGCATGTTTG 
GAGAAAAGCA 
CAAATGAAGA 
TGGTTGAAAA 
TATTTGGAAC 
GCACATACCA 
CAGCTCAACA 
GACATCACCA 
AAGCAGCATG 
AGTCTGAGTT 
GGTCTTCCAA 
CAATGGGAAC 
AT CATGGAGG 
TATAGAGACT 
TTTGAGCCCA 
TTTCATGTGG 
TGCAGCGACG 
TGCCGGGATG 
TGCCCACCAA 
TACAATGGCG 
GCAGGGTCTG 
TGCGGGAAGG 
TTACTCTGTA 
CCAACTTCCT 
GATGATGATA 
TGTTTAGATC 
TCCAAGGGTA 
GATTTCACCT 
CCCAAGGATG 
GGTGCCATCC 
AAGAAGAGAA 
ACACCGCCTT 
ATTAAGTTTG 
AAGGATGGGG 
ACCTGTCAGT 
TCTTTTTTTT 
GGAATCATTA 



ATAAGGCTGT 660 

TTCTTGACCT 72 0 

AAAATGGGAA 780 

GAGGCGTCAA 840 

AAGATGATAC 90 0 

CAGGTCGACC 960 

ATCTCACTAT 1020 

GAAGGAAGAG 10 80 

TTATGATTGT 1140 

ACAACTTTGC 12 00 

CCAGGGTTGT 12 60 

CCAACCCTGT 1320 

CTGATGCTGT 13 80 

ACTTTGGAGG 1440 

TGGCAGTGGC 1500 

CTTCTAGCAG 1560 

AAACAGGGGT 162 0 

TTTTACAGAG 1680 

CGGAATGTGG 1740 

AATGCTATGG 1800 

GGCCCTGCTG 1860 

CTGTGAACGA 192 0 

ATCTTCATAA 198 0 

AGTGCAAGAC 2040 

ACAAGTTCTG 210 0 

ATGGAGACCG 2160 

CCAATCTTAC 222 0 

TCTACCATCA 22 80 

CGGATGTGGG 2 3 40 

GGAAGTGCCT 2400 

AAGTCTGTTC 2460 

GGGCAGGGAC 2520 

AAGGACCCAA 2 580 

TGGTAGCAGC 2 640 

GGTTCGATCC 270 0 

GCACTGTTGG 2 760 

TAAACAAAAC 2 82 0 

TAAAAGAAAA 2 8 80 

AAACGGGGGA 2 940 

TCCCTAATGG 3000 
AAAA 
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45 



Seq ID NO: 325 Protein sequence: 
Protein Accession #: NP_003803



50 



55 



60 



I 

MKPPGSSSRQ 
RPRAWGAAAP 
INQDSESPYH 
HYENGKPQYS 
KSTGRPHIIQ 
LtELMIVNDHK 
I TTNPVQMLH 
LPMAVAQVLS 
RDFLQRGGGA 
SDGPCCNNTS 
NGECKTRDNQ 
LCTNLTRAPR 
LDRKCLQIQA 
KDEGPKGPSA 



11 

I 

PPLAGCSLAG 
SAPHWNETAE 
VLDTKARHQQ 
KGGEHCYYHG 
KTLAGQYSKQ 
TYKKHRSSHA 
EFSKYRQRIK 
QSLAQNLGIQ 
CLFNRPTKLF 
CLFQPRGYEC 
CQYIWGTKAA 
IGQLQGEIIP 
LNMSSCPLDS 
TNLIIGSIAG 



21 
1 

ASCGPQRGPA 
KNLGVLADED 
KHNKAVHLAQ 
SIRGVKDSKV 
MKNLTMERGD 
HTNNFAKSW 
QHADAVHLIS 
WEPSSRKPKC 
EPTECGNGYV 
RDAVNECD I T 
GSDKFCYEKL 
TSFYHQGRVI 
KGKVCSGHGV 
AILVAAIVLG 



31 
I 

GSVPASAPAR 
NTLQQNSSSN 
ASFQIEAFGS 
AL S TCNGLHG 
OWPFLSELQW 
NLVDSIYKEQ 
RVTFHYKRSS 
DCTESWGGCI 
EAGEECDCGF 
EYCTGDSGQC 
NTEGTEKGNC 
DCSGAHWLD 
CSNEATCICD 
GTGWGFKNVK 



41 
I 

TPPCRLLLVL 
ISYSNAMQKE 
KFILDLILNN 
MFEDDTFVYM 
LKRRKRAVNP 
LNTRWLVAV 
LSYFGGVCSR 
MEETGVSHSR 
HVECYGLCCK 
PPNLHKQDGY 
GKDGDRWIQC 
DDTDVGYVED 
FTWAGTDCS I 
KRRFDPTQQG 



51 

! 

LLLPPLAASS 60 

ITLPSRLIYY 12 0 

GLLSSDYVEI 180 

IEPLELVHDE 240 

SRGIFEEMKY 3 00 

ETWTEKDQID 3 60 

TRGVGVNEYG 42 0 

KFSKCSIIiEY 480 

KCSLSNGAHC 540 

ACNQNQGRCY 60 0 

SKHDVFCGFIj 660 

GTPCGPSMMC 72 0 

RDPVRNLHPP 780 
PI 



65 



Seq ID NO: 326 DNA sequence 

Nucleic Acid Accession #: AK074418.1 

Coding sequence: 244-1515 



70 



75 



80 



85 



CTTTCTCCAA 
ACCTGAGAGC 
AACAGATGGA 
AAATGACAGA 
GTCATGGCGT 
GACTTTACCA 
TTCCCCGCAG 
GTGATATGGA 
ATAAGCAGAT 
GGATCCTTGA 
CACCAGTATG 
GTGATTGATG 
CAAAACCAAG 
TATTCCGATC 
ATCACCAACA 
ACCAAGGCAG 
GCGATGGAGA 
CAATACCGAA 
ACCGAATGGA 



11 
I 

GACGGCCGGC 
CTGTGGAACC 
AAAAGTGAGG 
GCTGGAGTTC 
ATTACCAGGA 
CCTTGCGGGA 
CAGATTCTTC 
AGCGGCCACA 
TTGACATCCA 
CTCAGAACCC 
CTGGCATTTT 
ACCGCCTACC 
AGTTCTGGCC 
TGCACTATGG 
TCCATCTGCA 
GCTCCCTGAT 
ATGGGCTGGT 
GGGGCTGGGA 
GAGGGCGCTG 



21 
I 

CATGCTCTCC 
TGCCCGTCTC 
GACCGGTGAG 
TGCTGTGCCT 
GCCTTCAGTG 
TCACTGCCTG 
CATAGGCCAG 
GGATCTACCA 
ACAAGGAGGC 
ACAGTACAGG 
CCGTTTCCGG 
TGTCCAGGGA 
CTGCCTGCTG 
CTTCCTCGAG 
CTCTTCCCCT 
AACCTGTGCC 
GAGTCTCCAT 
AGAAATTATC 
GAGTGATGGG 



31 
I 

TCCTCTGCCA 
CCCTCCTCCA 
TGACTTGCTG 
GGAAAGGACC 
GAGACCTCCA 
AGCATGGGCC 
AAGCTGCTCC 
GGGGGTCCTC 
GCAGCTGACT 
CAGAAGATCC 
TTCTGGCAAT 
GATAAATGCC 
GAGAAGGCCT 
GATGCCCTGG 
GTGGACCTGG 
ACTCCAAGTG 
GCCTACACTG 
TCCCTGTGGA 
TCTCAGGAGT 



41 

I 

GTCTCCTCCA 
TCAGACACAC 
CTAAAGTTTA 
TCGGAAGTCT 
TCATCAAGTT 
GGACGTTTAA 
AGGAAAAACG 
CTCACTTCAT 
GCTGGTTCCT 
TGATGGT CCA 
GTGGCCAGTG 
TCTTTGTGCG 
ATGCCAAGCT 
TGGACCTCAC 
TGAAGGCAGT 
GGCCAACAGA 
TGACTGGGGC 
ACCCCTGGGG 
GGGAGGAAAC 



51 
I 

CCACTCTCTA 60 

CTGCCTAGGA 120 

TACCAGATGC 180 

TCTAAGGAGA 240 

CAAAG AC C AG 3 00 

GGATGAGACA 360 

CCTCTCCAAT 420 

CCTGGATGAT 480 

GGCAGCACTG 540 

AAGCTTTTCA 600 

GGTGGAAGTG 660 

TCCTCGCCAC 72 0 

GCTCGGATCC 780 

AGGAGGCGTG 840 

GAAGACAGCG 900 

T ACAG C AC AG 960 

TGAGCAGATT 102 0 

CTGGGG CG AG 1080 

CTGTGATCCG 1140 



308 



10 



15 



20 



WO 02/086443 

CGGAAAAGCC AGCTACATAA 
TTCCAACAGA AATTCATCGC 
GGAAACACAC TCCACGAAGG 
AACACTGCAG GAGGACCTCG 
GAAGGCACCA ATGTTGTCGT 
GAAGATGCAA AATTTCCACT 
CCAAAGCTCA AATAATAAAT 
GAACTATGTT GTGGTTGCAC 
CCTGAAAATG CCAGACAGTG 
AAGCCCTTCA GAACATGGCT 
GTACCTAGCA CCCAGGGGCC 
CCCTCACAGG CCCTTACTGG 
GCCTCTCTTC CTGGATCGTC 
CGCCCCACCC AGTCTCATCC 
GGATAATTAT GGGGTGTGAG 
ACCCCGTGAA ACCTTTCCTT 
CCCGGGAGCT AGCCAGCTTC 
TGCACACAGG ATTTCCTTAA 
GAATAAAATA GCTGCCAGGG 
AAAAAAAAAA AAAAAAAAAA 



GAAACGGGAA 

CATGTTTATA 

ATGGTCCCAA 

GAATGATGCT 

GTGCGTCACA 

CGATTTCCAA 

TCCGCCGCAA 

AGACACGGAG 

ACAGGCACCT 

CCCAACAAAG 

TTACGTGGGA 

GATGCAGAGA 

TCCAGAACTG 

GGGGGACTTC 

GTGCATTGCC 

CTCCTACTCG

AGAAAGCACA 

TGGCTTAATA 

GCTCTGCACA 

AAAAAAAAAA 



GATGGCGAGT 
TGTAGCGAAA 
ATAATGTTTA 
CAATTCAACT 
GTTGCTGTCA 
GTGATTCTGG 
CTTCACCATG 
AAAATCAGCG 
GAGCAGCCAT 
CATTTTCAAC 
TTGGAGAAAG 
GGAGAAGTGA 
CTGTGGCTGC 
AAGCTGGAAT 
CTCTAAATCT 
GCCACCTCCC 
TACAGCATCC 
AACTGTTATA 
ATGAGCCTCT 



TTTGGATGTC 
TT CCAATT AC 
GGAAG CAAGT 
TCTCTGTGCA 
CACCATCAAA 
CTGGCTCACA 
ACTTACCATC 
GAGTTCTTGC 
TTCAACCTCA 
AGATATGCTC 
GGGACCTGAG 
CTTGATGGAC 
CAAGCTCGGT 
GCAGAGCTTA 
TTAAACAAGC 
ACCAACCTGG 
TTGCTGCCAA 
AAGAACTCCT 
TACCGTTAAA 



GTGTCAAGAT 12 00 

CCTGGACCAT 12 60 

GATTCTAGGA 1320 

AG AGCCAATG 13 80 

TTTGAAAGCA 1440 

GAAACACTGT 1500 

TGAGCCCTGG 15 60 

TCCGAAT CTT 1620 

GAATGAAGGG 1680 

AGCAGGT ATG 1740 

GGAGGGACAG 1800 

TATTTTACCT 1860 

AGAGACGTGG 1920 

GAAAGGGAGG 1980 

AATTGGCAGT 2040 

CATCGTTCCT 2100 

ACCACCTATG 2160 

TGACTTGTCA 2220 

AAAAAAAAAA 22 8 0 
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Seq ID NO: 327 Protein sequence: 
Protein Accession #: BAB85075.1 



35 



1 

MAYYQEPSVE 
IWKRPQDLPG 
QYAGIFRFRF 
SDIiHYGFLED 
MENGLVSLHA 
KSQLHKKRED 
TAGGPRNDAQ 
KLK 



11 
I 

TSIIKFKDQD 
GPPHFILDDI 
WQCGQWVEW 
ALVDLjTGGVI 
YTVTGAEQIQ 
GEFWMSCQDF 
FNFSVQEPME 



21 
I 

FTTLRDHCLS 
SRFDIQQGGA 
IDDRLPVQGD 
TNIHLHSSPV 
YRRGWEEIIS 
QQKFIAMFIC 
GTNWVCVTV 



31 

I 

MGRTFKDETF 
ADCWFLAALG 
KCLFVRPRHQ 
DLVKAVKTAT 
LWNPWGWGET 
SEIPITLDHG 
AVTPSNLKAE 



41 

1 

PAADSSIGQK 
SLTQNPQYRQ 
NQEFWPCLLE 
KAGSLITCAT 
EWRGRWSDGS 
NTLHEGWSQI 
DAKFPLDFQV 



51 

I 

IiLQEKRIiSNV 60 

KILMVQSFSH 120 

KAYAKLLGSY 180 

PSGPTDTAQA 240 

QEWEETCDPR 3 00 

MFRKQVILGN 360 

ILAGSQKHCP 42 0 



40 



Seq ID NO: 328 DNA sequence 

Nucleic Acid Accession #: BC017490.1

Coding sequence: 74-2788 



45 



50 



55 



60 



65 



70 



75 



80 



85 



GTGGGTCACG 
TCGTGGTACT 
GCGTCGGCGA 
TGCCCTCACC 
CCTAGGCACA 
CATGGAAAGG 
TCTGGATGAT 
CATGCGGCAG 
GTATGACAGC 
GGCCACGGAG 
TCTCAAAGGC 
CCACCGCTTC 
GGAGCGCATC 
CTTGGCAGCC 
GCAGATCTTT 
CATCACCAAC 
GCTGAGGCAG 
TGGCGTCCTG 
GGGTCCTTTC 
GTCGGCCGGC 
CCGAATCCAG 
CATTCTCCTC 
CATCTATCAC 
C ACTGT CATC 
GACCGATGAA 
GATCTTTGCC 
TCTGGCCCTG 
TATCAACGTG 
TGAGAAAGTG 
CACGGCGTAT 
GGTTCTGGCT 
CAGAACCAGC 
CGTCACCTCC 
CTACGACCCC 
CTTTGACAT C 
CCGCTTCGTG 
GGCCAATGGC 
CCAGGAGGTC 
CCAGATGGAC 
GACAGGCAGC 
CCACGCGCGC 
CGTGATGCTG 
GACTTTTGCC 
GAAGCAGTTA 
CACTATTGAG 



11 
I 

TGAACCACTT 

GCTATGGCGG 

GGCAATGATC 

TCCAGCCCTG 

GAGGGGCCCC 

GACTACCGCG 

GAGGACGTAG 

CGTGACCGGG 

GATGAGGAGG 

GACGGCGAGG 

CACTCTGTGC 

AAGAACTTCC 

AGCGACATGT 

AGGGAGCACG 

GATGAGGCTG 

CACATCCATG 

CTGCATCTGA 

CCCCAGCTCA 

TGCCAGTCCC 

CCCTTTGAGG 

GAGAGTCCAG 

GCAGATCTGG 

AACAACTATG 

CTAGCCAACC 

GATGTGAAGA 

AGCATTGCTC 1 

TTCGGAGGGG 

CTCTTGTGCG 

T CCAGCCG AG 

GTCCAGCGGC 

GACCGAGGAG 

ATCCATGAGG 

CTGCAGGCTC 

TCGCTGACTT 

CTGTGTGTGG 

GTGGGCAGCC 

AGCGCTGCTG 

CTGAAGAAGT 

CAGGACAAGG 

ATCCCCATTA 

ATCCATCTGC 

GAGAGCTTCA 

CGCTACCTTT 

GTGGCAGAGC 

GTCCCTGAGA 



21 
I 

TTCGCGCGAA 
AAT CATCGGA 
CTCTCACCTC 
GCCGTGACCT 
TGGAGGAAGA 
CCATCCCAGA 
AGGAGCTGAC 
AGGCTGGCCG 
ACGAGGAGCG 
AGGACGAGGA 
GCGAGTGGGT 
TGCGCACTCA 
GCAAAGAGAA 
TGCTGGCCTA 
CCCTGGAGGT 
TCCGCATCTC 
ACCAGCTGAT 
GCATGGTCAA 
AGAACCAGGA 
TCAACATGGA 
GCAAAGTGGC 
TGGACAGCTG 
ATGGCTCCCT 
ACGTGGCCAA 
TGATCACTAG 
CTTCCATCTA 
AG CCCAAAAA 
GAGACCCTGG 
CCATCTTCAC 
ACCCTGTCAG 
TGTGTCTCAT 
CCATGGAGCA 
GCTGCACGGT 
TCTCTGAGAA 
TGAGGGACAC 
ACGTCAGACA 
AGCCCGCCAT 
ACATCATCTA 
TGGCCAAGAT 
CGGTGCGGCA 
GGGACTATGT 
TAGACACACA 
CATTCCGGCG 
AGGTGACATA 
AGGACTTGGT 



31 
I 

ACCTGGTTGT 
ATCCTTCACC 
CAGCCCTGGC 
TCCACCATTT 
AGAGGATGGA 
GCTGGACGCC 
GG CCAGTCAG 
GGGCCTGGGC 
CCCTGCCCGC 
GATGATCGAG 
GAGCATGGCG 
CGTCGACAGC 
CCGTGAGAGC 
CTTCCTGCCT 
GGTACTGGCC 
CCACCTGCCT 
CCGCACCAGT 
GTACAACTGC 
GGTGAAACCA 
GGAGACCATC 
GGCTGGCCGG 
CAAGCCAGGA 
CAACACTGCC 
GAAGGACAAC 
CCTCTCCAAG 
TGGTCATGAA 
CCCAGGTGGC 
CACAGCGAAG 
CACTGGCCAG 
CAGGGAGTGG 
TGATGAATTT 
ACAGAGCATC 
CATTGCTGCC 
CGTGGACCTC 
CGTGGACCCA 
CCACCCCAGC 
GCCCAACACG 
CGCCAAGGAG 
GTACAGTGAC 
CATCGAGTCC 
GATCGAAGAC 
GAAGTTCAGC 
TGACAACAAT 
TCAGCGCAAC 
GGATAAGGCT 



41 
1 

TGCTGTAGTG 
ATGGCATCCA 
CGAAGCTCCC 
GAGGATGAGT 
GAGGAGCTCA 
TATGAGGCCG 
AGGGAGGCAG 
CGCATGCGCC 
AAGCGCCGCC 
AGCATCGAGA 
GGCCCCCGGC 
CACGGCCACA 
CTGGTGGTGA 
GAGGCACCGG 
ATGTACCCCA 
CTGGTGGAGG 
GGGGTGGTGA 
AACAAGTGCA 
GGCTCCTGTC 
TATCAGAACT 
CTGCCCCGCT 
GACGAGATAG 
AATGGCTTCC 
AAGGTTGCTG 
GATCAGCAGA 
GACATCAAGA 
AAGCACAAGG 
TCGCAGTTTC 
GGGGCGTCGG 
ACCTTGGAGG 
GACAAGATGA 
TCCATCTCGA 
GCCAACCCCA 
ACAGAGCCCA 
GTCCAGGACG 
AACAAGGAGG 
TATGGCGTGG 
AGGGTCCACC 
CTGAGGAAAG 
ATGATCCGCA 
GACGT CAACA 
GTCATGCGCA 
GAGCTGTTGC 
CGCTTTGGGG 
CGTCAGATCA 



51 
I 

GCGGAGAGGA 60 

GCCCGGCCCA 12 0 

GGCGTACTGA 180 

CCGAGGGGCT 24 0 

TTGGAGATGG 300 

AGGGACTGGC 360 

CAGAGCGGGC 42 0 

GTGGGCTCCT 48 0 

AGGTGGAGCG 540 

ACCTGGAGGA 600 

TGGAGAT CCA 660 

ACGTCTTCAA 720 

ACTATGAGGA 780 

CGGAGCTGCT 840 

AGTACGACCG 900 

AGCTGCGCTC 960 

CCAGCTGCAC 102 0 

ATTTCGTCCT 1080 

CTGAGTGCCA 1140 

ACCAG CGT AT 1200 

CCAAGGACGC 12 60 

AGCTGACTGG 1320 

CTGTCTTTGC 1380 

TAGGGGAACT 1440 

TCGGAGAGAA 1500 

GAGGCCTGGC 1560 

TACGTGGTGA 1620 

TCAAGTATAT 1680 

CTGTGGGCCT 1740 

CTGGGGCCCT 1800 

ATGACCAGGA 1860 

AGGCTGGCAT 192 0 

TAGGAGGGCG 1980 

TCATCTCACG 2040 

AGATGCTGGC 2100 

AGGAGGGGCT 2160 

AGCCCCTGCC 2220 

CGAAGCTCAA 2280 

AATCTATGGC 2 340 

TGGCGGAGGC 2400 

TGGCCATCCG 2460 

GCATGCGCAA 2 520 

TCTTCATACT 2580 

CCCAGCAGGA 2 640 

ACATCCACAA 2 700 
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CCTCTCTGCA TTTTATGACA 
AAGGAAAATG ATCCTGCAGC 
TTCTGGTTTG GGGTGGTCAG 
TGAACT CGGG GTACTAGGGT 
TGTTTGTTTC TCCAAGCCTG 
TGTCTTACTT GGTTGCTGAA 
TTGGATCAGA GCTGCTGAGT 
ATGGATGTCA GGAGAGCTGC 
TGCCTTTGGC CAGAGAGCTG 
TCTGTGCCCC TGTGGTGGAA 
GTCGCAGGGG TGGGATGTGA 
TTGCTCCCTG TCTGTTTCCC 
TAATTTTTAA TAAAGTTGAA 



GTGAGCTCTT 
AGTTCTGAGG 
TGCCCTCTGT 
CAGGGCTTAT 
CTTTGTGCTT 
CATCTTGCCA 
TCAGGATGCC 
TGCCCTCTTG 
GTTGAAGATG 
GAGGGCACGA 
GTCATGCGGA 
CACTCTCTTA 
TAAAATATAA 



CAGGATGAAC 
CCCTATGCCA 
GCTTTATGGA 
AGCAGGATGT 
CTCACCTTTG 
CCTCCGAGTG 
TGCGTGTGGT 
GCGTGAGTTG 
TTTGTAATCG 
CAGTGCCAGC 
TTATCCACTC 
TTTGTGCATT 
AAAAAAAAAA 



AAGTTCAGCC 
TCCATAAGGA 
CACAAAACCA 
CTGGCTGCAC 
GGTGGGATGC 
CTTTGTCTCC 
TTAGGTGTTA 
CGTATTCAGG 
TTTTCAGTCT 
GCAGCGTTCT 
GCCACAGTTA 
CGGTTTGGTT 
AAAAAA 



ACGACCTGAA 
TTCCTTGGGA 
GAGCACTTGA 
CTGGCATGAC 
CTTGCCAGTG 
ACTCAGTACC 
GCCTTCTTAC 
CTGCTTTTGC 
CCTGCAGGTT 
GGGCTCCTCA 
TCAGCTGCCA 
TCTGTAGTTT 



Seq ID NO: 329 Protein sequence: 
Protein Accession #: AAH17490.1 



11 



MAESSESFTM 
GPLEEEEDGE 
DREAGRGLGR 
SVREWVSMAG 
EHVLAYFLPE 
HLNQLIRTSG 
FEVNMEETIY 
NYDGSLNTAN 
IAPSIYGHED 
SRAIFTTGQG 
HEAMEQQSIS 
CWRDTVDPV 
KKYIIYAKER 
HLRDYVIEDD 
AEQVTYQRNR 
LQQF 



ASSPAQRRRG 
ELIGDGMERD 
MRRGLLYDSD 
PRIiEIHHRFK 
APAELLQIFD 
WTSCTGVLP 
QNYQRIRIQE 
GFPVFATVIL 
IKRGLALALF 
ASAVGLTAYV 
ISKAGIVTSL 
QDEMLARFW 
VHPKLNQMDQ 
VNMAIRVMLE 
FGAQQDTIEV 



21 
I 

NDPLTSSPGR 
YRAIPELDAY 
EEDEERPARK 
NFLRTHVDSH 
EAALEWLAM 
QLSMVKYNCN 
SPGKVAAGRL 
ANHVAKKDNK 
GGEPKNPGGK 
QRHPVSREWT 
QARCTVIAAA 
GSHVRHHPSN 
DKVAKMYSDL 
SFIDTQKFSV 
PEKDLVDKAR 



31 

] 

SSRRTDALTS 
EAEGLALDDE 
RRQVERATED 
GHNVFKERIS 
YPKYDRITNH 
KCNFVLGPFC 
PRSKDAILLA 
VAVGELTDED 
HKVRGDINVIj 
LEAGALVLAD 
NPIGGRYDPS 
KEEEGLANGS 
RKESMATGSI 
MRSMRKTFAR 
QINIHNLSAF 



41 
i 

SPGRDLPPFE 
DVEELTASQR 
GEEDEEMIES 
DMCKENRESL 
IHVRISHLPL 
QSQNQEVKPG 
DLVDSCKPGD 
VKMITSLSKD 
LCGDPGTAKS 
RGVCLIDEFD 
LTFSENVDLT 
AAEPAMPNTY 
PITVRHIESM 
YLSFRRDNNE 
YDSELFRMNK 



51 
I 

DESEGLLGTE 
EAAERAMRQR 
IENLEDLKGH 
WNYEDLAAR 
VEELRSLRQL 
SCPECQSAGP 
EIELTGIYHN 
QQIGEKIFAS 
QFLKYIEKVS 
KMNDQDRTSI 
EPIISRFDIL 
GVEPLPQEVL 
IRMAEAHARI 
LLLFIIiKQLV 
FSHDLKRKMI 



Seq ID NO: 330 DNA sequence 
Nucleic Acid Accession #: M17254 
Coding sequence: 257-1645



85 



GTCCGCGCGT 
CGGGTCGCAC 
CTTTGGAGAC 
AAAGATGGCA 
TGGCTTACTG 
CTTATCAGTT 
GGCTAAGACA 
CCCACGCGTC 
GGAATGTAAC 
CAAAGGCGGG 
GGAGGAGAAG 
AGCAG AT CCT 
AGAATATGGC 
GTGCAAGATG 
TCTCTCACAT 
TGATAAAGCC 
TGAGCCCCCC 
TGCTCAACCA 
TTATCAGATT 
GCTTTGGCAG 
GGAAGGCACC 
AGAGCGGAAG 
CTATGACAAG 
CCACGGGATC 
CTCAGACCTC 
GCCCCACCCT 
CTGGAATTCA 
TTCTCATCTG 
CACCAGCCCA 
TGAAAAAAGC 
GAGGGAGTTA 
GGACATATCA 
AAGGACAAAG 
AATCCCACTA 
AACATACCGT 
TCAAAAACAA 
ACTGCATGGC 
CAGCTTTCTC 
ACTATGAACT 
AGGGGTGAAG 
TCTCAAGCAA 
ACTCGAGGGT 
GTAATGGAGA 
TGT CAAATGA 
TCATTATGTG 



11 
I 

GTCCGCGCCC 
TAACTCCCTC 
CCGAGGAAAG 
GAACCAAGGG 
AAGGACATGA 
GTGAGTGAGG 
GAGATGACCG 
CCTCAGCAGG 
CCTAGCCAGG 
AAGATGGTGG 
CACATGCCAC 
ACGCTATGGA 
CTTCCAGACG 
ACCAAGGACG 
CTCCACTACC 
TTACAAAACT 
AGGAGAT CAG 
TCTCCTTCCA 
CTTGGACCAA 
TTCCTCCTGG 
AACGGGGAGT 
AGCAAACCCA 
AACATCATGA 
GCCCAGGCCC 
CCGTACATGG 
CCAGCCCTCC 
CCAACTGGGG 
GGCACTTACT 
TCGCCAGAAA 
TTTACTGGGG 
CTGAAGTCTT 
TCTGTGGACT 
TGCCAAAGAA 
ATGCAAACTG 
TTATAATGCC 
GAGAAAAGAC 
ATGTGCTGTT 
AAACTGTGAA 
AAAAGGTGGG 
AAGGAGGAGG 
TGAAGACTGG 
TCATGCAGTC 
AAGGGAAGTA 
AAATTTTAAC 
GGGGCTTTGT 



21 
I 

GCGTGTGCCA 
GGCGCCGACG 
CCGTGT TGAC 
CAACTAAAGC 
TTCAGACTGT 
ACCAGTCGTT 
CGTCCTCCTC 
ATTGGCTGTC 
TGAATGGCTC 
GCAGCCCAGA 
CCCCAAACAT 
GTACAGACCA 
TCAACATCTT 
ACTTCCAGAG 
TCAGAGAGAC 
CTCCACGGTT 
CCTGGACCGG 
CAGTGCCCAA 
CAAGTAGCCG 
AGCTCCTGTC 
TCAAGATGAC 
ACATGAACTA 
CCAAGGTCCA 
TCCAGCCCCA 
GCTCCTATCA 
CCGTGACATC 
GTATATACCC 
ACTAAAGACC 
CTCTATCGGA 
CTGGGGAAGG 
ACTACAGAAA 
GACCTTGTAA 
AGTGGTCTTA 
GGATGAAACT 
ATTTTAAGGA 
ACGAGAGAGA 
TTGGTTGAAA 
GATGACCCAA 
ACTGAGGATG 
AAGAGGCAGA 
ACTCAGGACA 
AGTGTTATAC 
GTAGAATTCA 
TGGAATTGTC 
TCTCCACAGG 



31 
I 

GCGCGCGTGC 
GCGGCGCTAA 
CAAAAGCAAG 
CGTCAGGTTC 
CCCGGACCCA 
GTTTGAGTGT 
CAGCGACTAT 
TCAACCCCCA 
AAGGAACTCT 
CACCGTTGGG 
GACCACGAAC 
TGTGCGGCAG 
GTTATTCCAG 
GCTCACCCCC 
TCCTCTTCCA 
AATGCATGCT 
TCACGGCCAC 
AACTGAAGAC 
CCTTGCAAAT 
GGACAGCTCC 
GGATCCCGAC 
CGATAAGCTC 
TGGGAAGCGC 
CCCCCCGGAG 
CGCCCACCCA 
TTCCAGTTTT 
CAACACTAGG 
TGGCGGAGGC 
GAACATGAAT 
AAGCCGGGGA 
TGAGGAGGAT 
AAGACAGTGT 
AGAAATGTAT 
AAAGCAATAG 
AAACTACCTG 
CTGTGGCCCA 
TCAAATACAT 
AGTTTCCAAC 
TGTATAGAGT 
GAAGGAGGAG 
TTTGGGGACT 
CAAACCCAGT 
GAAACAAAAA 
TGATATTTAA 
GTCAGGTAAG 



41 
I 

CTTGGCCGTG 
CCTCTCGGTT 
ACAAATGACT 
TGAACAGCTG 
GCAGCT CAT A 
GCCTACGGAA 
GGACAGACTT 
GCCAGGGTCA 
CCTGATGAAT 
ATGAACTACG 
GAG CG CAG AG 
TGGCTGGAGT 
AACATCGATG 
AGCTACAACG 
CATTTGACTT 
AGAAACACAG 
CCCACGCCCC 
CAGCGTCCTC 
CCAGGCAGTG 
AACTCCAGCT 
GAGGTGGCCC 
AGCCGCGCCC 
TACGCCTACA 
TCATCTCTGT 
CAGAAGATGA 
TTTGCTGCCC 
CTCCCCACCA 
TTTTCCCATC 
CAAAAGTGCC 
AG AG AT C CAA 
GCTAAAAATG 
ATGTAGAAGC 
AAACTTTAGA 
AAACAACACA 
TATTTAAAAA 
TCAACAGACG 
TCCGTTTGAT 
TCCTTTACAG 
GAGCGTGTGA 
ACCAGGCTGG 
GTGTACAATG 
GTTAGGAGAA 
TG CG CAT CT C 
GAG AAACAT T 
AG AT GGCCT T 



51 

I 

CGCGCCGAGC 
ATTCCAGGAT 
CACAGAGAAA 
GTAGATGGGC 
TCAAGGAAGC 
CGCCACACCT 
C CAAG AT GAG 
CCATCAAAAT 
GCAGTGTGGC 
GCAGCTACAT 
TTATCGTGCC 
GGGCGGTGAA 
GGAAGGAACT 
CCGACATCCT 
CAGATGATGT 
ATTTACCATA 
AGTCGAAAGC 
AGTTAG AT CC 
GCCAGATCCA 
G CAT C AC CTG 
GGCGCTGGGG 
T CCGTT ACT A 
AGTTCGACTT 
ACAAGTACCC 
ACTTTGTGGC 
CAAACCCATA 
GCCATATGCC 
AGCGTGCATT 
TCAAGAGGAA 
AGACTCTTGG 
TCACGAATAT 
ATGAAGTCTT 
GTAGAGTTTG 
GTTTTGACCT 
TAGTTTCATA 
TTGATATGCA 
GGACAGCTGT 
TATTACCGGG 
TTGTAGACAG 
GAAAGAAACT 
AGTTATGGAG 
AGGACACAGC 
TTTCTTTGTT 
CAGGACCTCA 
CTTGGCTGCC 



2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
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60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 



310 



WO 02/086443 

ACAATCAGAA ATCACGCAGG CATTTTGGGT AGGCGGCCTC CAGTTTTCCT TTGAGTCGCG 2760 

AACGCTGTGC GTTTGTCAGA ATGAAGTATA CAAGTCAATG TTTTTCCCCC TTTTTATATA 2820 

ATAATTATAT AACTTATGCA TTTATACACT ACGAGTTGAT CTCGGCCAGC CAAAGACACA 2880 

CGACAAAAGA GACAATCGAT ATAATGTGGC CTTGAATTTT AACTCTGTAT GCTTAATGTT 2 940 

TACAATATGA AGTTATTAGT TCTTAGAATG CAGAATGTAT GTAATAAAAT AAGCTTGGCC 3000 

TAGCATGGCA AATCAGATTT ATACAGGAGT CTG CATTTGC ACTTTTTTTA GTGACTAAAG 3060 

TTGCTTAATG AAAACATGTG CTGAATGTTG TGGATTTTGT GTTATAATTT ACTTTGTCCA 312 0 
GGAACTTGTG CAAGGGAGAG CCAAGGAAAT AGGATGTTTG GCACCC 

Seq ID NO: 331 Protein sequence 
Protein Accession #: AAA52398

1 11 21 31 41 51 

I I 1 1 I I 

MIQTVPDPAA HIKEALSWS EDQSLFECAY GTPHLAKTEM TASSSSDYGQ TSKMSPRVPQ 60 

QDWLSQPPAR VTIKMECNPS QVNGSRNSPD ECSVAKGGKM VGSPDTVGMN YGSYMEEKHM 120 

PPPNMTTNER RVIVPADPTL WSTDHVRQWL EWAVKEYGLP DVNILLFQNI DGKELCKMTK 180 

DDFQRLTPSY NADILLSHLH YLRETPLPHL TSDDVDKALQ NSPRLMHARN TDLPYEPPRR 240 

SAWTGHGHPT PQSKAAQPSP STVPKTEDQR PQLDPYQILG PTSSRLANPG SGQIQLWQFL 300 

LELLSDSSNS SCITWEGTNG EFKMTDPDEV ARRWGERKSK PNMNYDKLSR ALRY YYDKN I 360 

MTKVHGKRYA YKFDFHGIAQ ALQPHPPESS LYKYPSDLPY MGSYHAHPQK MNFVAPHPPA 420 

LPVTSSSFFA APNPYWNSPT GGIYPNTRLP TSHMPSHLGT YY 462 

Seq ID NO: 332 DNA sequence 
Nucleic Acid Accession #: NM_000020
Coding sequence: 283-1794 

1 11 21 31 41 51 

| | | | | |

AGGAAACGGT TTATTAGGAG GGAGTGGTGG AGCTGGGCCA GGCAGGAAGA CGCTGGAATA 60 

AGAAACATTT TTGCTCCAGC CCCCATCCCA GTCCCGGGAG GCTGCCGCGC CAGCTGCGCC 12 0 

GAGCGAGCCC CTCCCCGGCT CCAGCCCGGT CCGGGGCCGC GCCGGACCCC AGCCCGCCGT 180 

CCAGCG CTGG CGGTGCAACT GCGGCCGCGC GGTGGAGGGG AGGTGGCCCC GGTCCGCCGA 240 

AGGCTAGCGC CCCGCCACCC G C AG AG CGGG CCCAGAGGGA CCATGACCTT GGGCTCCCCC 300 

AGGAAAGGCC TTCTGATGCT GCTGATGGCC TTGGTGACCC AGGGAGACCC TGTGAAGCCG 3 60 

TCTCGGGGCC CGCTGGTGAC CTGCACGTGT GAGAGCCCAC ATTG CAAGGG GCCTACCTGC 420 

CGGGGGGCCT GGTGCACAGT AGTGCTGGTG CGGGAGGAGG GGAGGCACCC CCAGGAACAT 480 

CGGGGCTGCG GGAACTTGCA CAGGGAG CT C TGCAGGGGGC GCCCCACCGA GTT CGTCAAC 540 

CACTACTGCT GCGACAGCCA CCTCTGCAAC CACAACGTGT CCCTGGTGCT GGAGGCCACC 600 

CAACCTCCTT CGGAGCAGCC GGGAACAGAT GGCCAGCTGG CCCTGATCCT GGGCCCCGTG 660 

CTGGCCTTGC TGGCCCTGGT GGCCCTGGGT GTCCTGGGCC TGTGGCATGT CCGACGGAGG 72 0 

CAGGAGAAGC AGCGTGGCCT GCACAGCGAG CTGGGAGAGT CCAGTCTCAT CCTGAAAGCA 7 80 

TCTGAGCAGG GCGACACGAT GTTGGGGGAC CTCCTGGACA GTGACTGCAC CACAGGGAGT 840 

GGCTCAGGGC TCCCCTTCCT GGTGCAGAGG ACAGTGGCAC GGCAGGTTGC CTTGGTGGAG 900 

TGTGTGGGAA AAGGCCGCTA TGGCGAAGTG TGGCGGGGCT TGTGGCACGG TGAGAGTGTG 960 

GCCGTCAAGA TCTTCTCCTC GAGGGATGAA CAGTCCTGGT TCCGGGAGAC TGAGATCTAT 102 0 

AACACAGTAT TGCTCAGACA CGACAACATC CTAGGCTTCA TCGCCTCAGA CATGACCTCC 10 8 0 

CGCAACTCGA GCACGCAGCT GTGGCTCATC ACGCACTACC ACGAGCACGG CTCCCTCTAC 114 0 

GACTTTCTGC AGAGACAGAC GCTGGAGCCC CATCTGGCTC TGAGGCTAGC TGTGTCCGCG 12 0 0 

GCATGCGGCC TGGCGCACCT GCACGTGGAG ATCTTCGGTA CACAGGGCAA ACCAGCCATT 1260 

GCCCACCGCG ACTTCAAGAG CCGCAATGTG CTGGTCAAGA GCAACCTGCA GTGTTGCATC 132 0 

GCCGACCTGG GCCTGGCTGT GATGCACTCA CAGGGCAGCG ATTACCTGGA CATCGGCAAC 1380 

AACCCGAGAG TGGGCACCAA GCGGTACATG GCACCCGAGG TGCTGGACGA GCAGATCCGC 1440 

ACGGACTGCT TTGAGTCCTA CAAGTGGACT GACATCTGGG CCTTTGGCCT GGTGCTGTGG 1500 

GAGATTGCCC GCCGG AC CAT CGTGAATGGC AT CGTGGAGG ACTATAGACC ACCCTTCTAT 1560 

GATGTGGTGC CCAATGACCC CAGCTTTGAG GACATGAAGA AGGTGGTGTG TGTGGATCAG 162 0 

CAGACCCCCA CCATCCCTAA CCGGCTGGCT GCAGACCCGG TCCTCTCAGG CCTAGCTCAG 1680 

ATGATGCGGG AGTGCTGGTA CCCAAACCCC TCTGCCCGAC TCACCGCGCT GCGGATCAAG 1740 

AAGACACTAC AAAAAATTAG CAACAGTCCA GAGAAGCCTA AAGTGATTCA ATAGCCCAGG 1800 

AGCACCTGAT TCCTTTCTGC CTGCAGGGGG CTGGGGGGGT GGGGGGCAGT GGATGGTGCC 1860 

CTATCTGGGT AGAGGTAGTG TGAGTGTGGT GTGTGCTGGG GATGGGCAGC TGCGCCTGCC 192 0 

TGCTCGGCCC CCAGCCCACC CAGCCAAAAA TACAGCTGGG CTGAAACCTG ATCCCCTGCT 1980 

GTCTGGCCTG CTCAAAGCGG CAGGCTCCCT GACGCCTGGC TCTCTCCCCA CCCCTATGGC 2 040 

CAGCATGGTG CACCCCCTAC CACTCCCGGG ACAGGATGCA AAAGAGGCTC CAGAGTCAGA 2100 

GTGCCAAGCC AGGGAATCCC AGT CCCAG AC TCAGAGCCCG GGCCTGCACT TTGCCCCCTG 2160 

CCCTTGATCA ACCCCACTGC CCCACCAGAG CTGCCAGGGT GGCACAGGGC CCTGTCCAGC 222 0 

CCCTGGCACA CACTTCCCTG CCAGGCCTCA GCCTCTAGCA TAAGCT CCAG AGAGCCAGGG 22 80 

CCCATCAGTT TCTCTCTGTG GAT TTGTATC TCAGCTCCAT GATGCCTTGG GCTTTCTGTC 234 0 

TCCTCAACAA GAGTGCAGCT TGCTGAATGT CAGCTGCCTG AGAGAGCTGG GGCCTGACTT 2400 

ACTAGGGCAT TAAATCCTAA GAGGTCCTAC TGAGGTGTGG CAGGATCACA GGCCAGTGGA 2460 

AAAAGGGCAG GTCAGATGGG CAAGG CCCAG GACTTTCAGA TTAACTGAGA GGATATCGAG 252 0 

GCCAAGCATG GCAGGGGGAA GGTCAGTGGG TGTCAAGAGA CCCAGGTCTG ACCCCGGATG 2580 

TTTGCTCCAT GTGACAAAAG CAGGCCTGTC TCAGGACCTT TTCTTTTCTT TTTTCCTTCT 2640 

TTTTTTTTTT GACACGGAGT TTCGCTCTTG TTGTCCAGGC TAGAGTGCAA TGGCATGATC 2 70 0 

CCAGCTCACC GCAACGTCTA CCTCCCAGGT TCAAATCATT CTCTTGCCTC AGACTCCCGA 2760 

GTAGCTGGGA TTACAGGCAC ATGCCACCAT GCCTGGCTAA TTTTGTATAT TTAGTAGAAA 2820 

CAGGGTTTCA CCATGCTGGC CATGCTGGTT CTCGAACTCC TGACCTCAGG TGTTCCACCT 2880 

ACCTCAGCCT CCCAAAGTGC TGGGGTTACA GGTGTGAGCC ATCGCGCCTG GCCAGGACCT 2 940 

TTGTTTCTTA TCTACATATT GGAAGATTTG GTCCTGATGT CCTTTGAGGC TTCTTTAGCT 3000 

CTAGTTCTCT GACACTT CAG CCTATATCAC AGCTAACTTC YTCAGTCTCA TCTATTCCTT 3060 

ATGCTCCAGC CCCTGGCAAT TTGCCTCAAG ATGGGGGTTT GAAAATAACT TTACCTGACT 3120 

CAAGGAGTGT CTGGAGCACC TCCTAGTCTA AGTCTGCAAG CTCCAGTTCT TGCCTAAAAC 3180 

CATGCCAGTG GCCACCCTTG GGCTCAGACA GCTCTGGGCC TTTTGACCAC AAGCCAGCCC 3240 

CTCGCCCTCT CTGTGGCATA GTCTTCTCTG CCCCAGGACT GCAGGGCGGC TTCCTCCAAG 3300 

GCTTCCAAGG CTCAAAAGAA ATTTGGCTCC AT CCAAGAAG GCTCCAGCTC CCCTACTGGC 3360 

CCCTGGCTTC AGGCCCACAC CCCTGGGCCA GGSCCAGAGA GTGTGTCTCA GGAGAATTCA 3420 

ATGGGCTCTA GAGAGACACA CAGAAAGTTT GGGCATTTGG GAAATTTTCA AGGRTGTATG 3480 



311 



WO 02/086443 

TATGGYTCAC GTATGGWGCA GGTTGTCCTG GTCCYKGGGT GCAGGGAAGT GGGCTGCAGG 3540 

GAAGTGGATT GGAGGGGAGC TTGAGGAATA TAAGGAGCGG GGGTGGAGAC TCAGGCTATG 3600 

GACAAGGACA GCCCCAAGGT TGGGAAGACC TGGCCTTAGT CGTCCTCAGC CTAGGGCAGG 3660 

GCAGTGAAGA AAGCTCTCCC CGCTCCTGCT GTAATGACCC AGAGTAGCCT CCCCAGGCCG 3720 

GCATCTTATG TGTGTCTTCC ACCATCCTCA TGGTGGCACT TTTCTAGGCC TGTCTCCCAG 3780 

CATTGTGCAA GGCTCGGAAG AGAACCAGGA AGTGAAACTG GGTGAAAACA GAAAGCTCAA 3 840 

TGGATGGGCT AGGTTCCCAG AT CAT T AGGG CAGAGTTTGC ACGTCCTCTG GTTCACTGGG 3 900 

AATCCACCCA GCCCACGAAT CATCTCCCTC TTTGAAGGAT TTTWATTTCT ACTGGGTTTT 3 960 

GGAACAAACT CCTGCTGAGA CCCCACAGCC AGAAACTGAA AGCAGCAGCT CCCCAAAGCC 4020 

TGGAAAATCC CTAAGAGAAG GCCTGGGGGA MAGGAAKTGG AGTGACAGGG GACAGGTAGA 4080 

GAGAAGGGGG CCCAATGGCC AGGGAGTGAA GGAGGTGGCG TTGCTGAGAG CAGTCTGCAC 4140 

ATGCTTCTGT CTGAGTG C AG GAAGGTGTTC CAGGGTCGAA ATTACACTTC TCGTACCTGG 4200 

AGACGCTGTT TGTGGGAGCA CTGGGCTCAT GCCTGGCACA CAATAGGTCT GCAATAAACC 4260 
ATGGTTAAAT CCTGAAAAAA AAAAAAAAA 

Seq ID NO: 333 Protein sequence 
Protein Accession #: NP_000011



1 11 21 31 41 51 

I I I I I I 

MTLGSPRKGL LMLLMALVTQ GDPVKPSRGP LVTCTCESPH CKGPTCRGAW CTWLVREEG 60 

RHPQEHRGCG NLHRELCRGR PTEFVNHYCC DSHLCNHNVS LVLEATQPPS EQPGTDGQLA 120

LILGPVLALL ALVALGVLGL WHVRRRQEKQ RGLHSELGES SLILKASEQG DTMLGDLLDS 180 

DCTTGSGSGL PFLVQRTVAR Q VALVE CVGK GRYGEVWRGL WHGESVAVKI FSSRDEQSWF 240 

RETEIYNTVL LRHDNILGFI ASDMTSRNSS TQLWLITHYH EHGSLYDFLQ RQTLEPHLAL 300 

RLAVSAACGL AHLHVE I FGT QGKPAIAHRD FKSRNVLVKS NLQCCIADLG LAVMHSQGSD 360 

YLDIGNNPRV GTKRYMAPEV LDEQIRTDCF ESYKWTDIWA FGLVLWEIAR RTIVNGIVED 420 

YRPPFYDWP NDPSFEDMKK WCVDQQTPT IPNRLAADPV LSGLAQMMRE CWYPNPSARL 480 
TALRIKKTLQ KISNSPEKPK VIQ 

Seq ID NO: 334 DNA sequence

Nucleic Acid Accession #: NM_004126.1 

Coding sequence: 108-329 

1 11 21 31 41 51 

I I I I I I 

GGCACGAGCT CGTGCCGGCC TTCAGTTGTT TCGGGACGCG CCGAGCTTCG CCGCTCTTCC 60 

AGCGGCTCCG CTGCCAGAGC TAGCCCGAGC CCGGTTCTGG GGCGAAAATG CCTGCCCTTC 12 0 

ACATCGAAGA TTTGCCAGAG AAGGAAAAAC TGAAAATGGA AGTTGAGCAG CTTCGCAAAG 180 

AAGTGAAGTT GCAGAGACAA CAAGTGT CTA AATGT TCTGA AGAAATAAAG AACTATATTG 240 

AAGAACGTTC TGGAGAGGAT CCTCTAGTAA AGGGAATTCC AGAAGACAAG AACCCCTTTA 3 00 

AAGAAAAAGG CAGCTGTGTT ATTTCATAAA TAACTTGGGA GAAACTGCAT CCTAAGTGGA 360 

AGAACTAGTT TGTTTTAGTT TTCCCAGATA AAACCAACAT GCTTTTTAAG GAAGGAAGAA 420 

TGAAAT TAAA AGGAGACTTT CTTAAGCACC ATATAGATAG GGTTATGTAT AAAAGCATAT 480 

GTGCTACTCA TCTTTGCTCA CTATGCAGT C TTTTTTAAGA GAGCAGAGAG TATCAGATGT 540 

ACAATTATGG AAATAAGAAC ATTACTTGAG CATGACACTT CTTTCAGTAT ATTGCTTGAT 600 
GCTTCAAATA AAGTTTTGTC TT 

Seq ID NO: 335 Protein sequence 
Protein Accession #: NP_004117.1 

1 11 21 31 41 51 

I I I I I I 

MPALHIEDLP EKEKLKMEVE QLRKEVKLQR QQVSKCSEEI KNYIEERSGE DPLVKGIPED 60 
KNPFKEKGSC VIS 



Seq ID NO: 336 DNA sequence 
Nucleic Acid Accession #: NM_005795 
Coding sequence: 555-1940 

1 11 21 31 41 51 

| I I 1 I I 

GCACGAGGGA ACAACCTCTC TCTCTSCAGC AGAGAGTGTC ACCTCCTGCT TTAGGACCAT 60 

CAAGCTCTGC TAACTGAATC TCAT CCTAAT TGCAGGATCA CATTGCAAAG CTTTCACTCT 120 

TTCCCACCTT GCTTGTGGGT AAATCTCTTC TGCGGAATCT CAGAAAGTAA AGTTCCATCC 180 

TGAGAATATT TCACAAAGAA TTTCCTTAAG AGCTGGACTG GGTCTTGACC CCTGGAATTT 240 

AAGAAATTCT TAAAGACAAT GTCAAATATG ATCCAAGAGA AAATGTGATT TGAGTCTGGA 300 

GACAATTGTG CATATCGTCT AATAATAAAA ACCCATACTA GCCTATAGAA AACAATATTT 360 

GAATAATAAA AACCCATACT AGCCTATAGA AAACAATATT TGAAAGATTG CTACCACTAA 42 0 

AAAGAAAACT ACTACAACTT GACAAGACTG CTGCAAACTT CAATTGGTCA CCACAACTTG 480 

ACAAGGTTGC TATAAAACAA GATTGCTACA ACTTCTAGTT TATGTTATAC AGCATATTTC 540 

ATTTGGGCTT AATGATGGAG AAAAAGTGTA CCCTGTATTT TCTGGTTCTC TTGCCTTTTT 60 0 

TTATGATTCT TGTTACAGCA GAATTAGAAG AGAGTCCTGA GGACTCAATT CAGTTGGGAG 660 

TTACTAGAAA TAAAATCATG ACAGCTCAAT ATGAATGTTA CCAAAAGATT ATGCAAGACC 720 

CCATTCAACA AGCAGAAGGC GTTTACTGCA ACAGAACCTG GGATGGATGG CTCTGCTGGA 780 

ACGATGTTGC AGCAGGAACT GAAT CAATGC AGCTCTGCCC TGATTACTTT CAGGACTTTG 840 

ATCCATCAGA AAAAGTTACA AAGATCTGTG ACCAAGATGG AAACTGGTTT AGACATCCAG 900 

CAAGCAACAG AACATGGACA AATTATACCC AGT GTAATGT TAACACCCAC GAGAAAGTGA 960 

AGACTGCACT AAATTTGTTT TACCTGACCA TAATTGGACA CGGATTGTCT ATTGCATCAC 102 0 

TGCTTATCTC GCTTGGCATA TTCTTTTATT TCAAGAGCCT AAGTTGCCAA AGGATTACCT 1080 

TACACAAAAA TCTGTTCTTC TCATTTGTTT GTAACTCTGT TGTAACAATC ATTCACCTCA 1140 

CTGCAGTGGC CAACAACCAG GCCTTAGTAG CCACAAATCC TGTTAGTTGC AAAGTGTCCC 12 00 

AGTTCATTCA TCTTTACCTG ATGGGCTGTA ATTACTTTTG GATGCTCTGT GAAGGCAT TT 12 60 

ACCTACACAC ACTCATTGTG GTGG CCGTGT TTGCAGAGAA GCAACATTTA ATGTGGTATT 1320 

ATTTTCTTGG CTGGGGATTT CCACTGATTC CTGCTTGTAT ACATGCCATT GCTAGAAGCT 1380 
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TATATTACAA TGACAATTGC TGGATCAGTT CTGATACCCA TCTCCTCTAC ATTATCCATG 1440 

GCCCAATTTG TGCTGCTTTA CTGGTGAATC TTTTTTTCTT GTTAAATATT GTACGCGTTC 1500

TCATCACCAA GTTAAAAGTT ACACACCAAG CGGAATCCAA TCTGTACATG AAAGCTGTGA 1560 

GAGCTACTCT TATCTTGGTG CCATTGCTTG GCATTGAATT TGTGCTGATT CCATGGCGAC 1620 

CTGAAGGAAA GATTGCAGAG GAGGTATATG ACTACATCAT GCACATCCTT ATGCACTTCC 1680 

AGGGTCTTTT GGTCTCTACC ATTTTCTGCT TCTTTAATGG AGAGGTTCAA GCAATTCTGA 1740 

GAAGAAACTG GAATCAATAC AAAATCCAAT TTGGAAACAG CTTTTCCAAC TCAGAAGCTC 1800 

TTCGTAGTGC GTCTTACACA GTGTCAACAA TCAGTGATGG TCCAGGTTAT AGT CATG ACT 1860 

GTCCTAGTGA ACACTTAAAT GGAAAAAGCA TCCATGATAT TGAAAATGTT CTCTTAAAAC 192 0 

CAGAAAATTT ATATAATTGA AAATAGAAGG ATGGTTGTCT CACTGTTTGG TGCTTCTCCT 1980 

AACTCAAGGA CTTGGACCCA TGACTCTGTA GCCAGAAGAC TTCAATATTA AATGACTTTG 2040 

GGGAATGTCA TAAAGAAGAG CCTTCACATG AAATTAGTAG TGTGTTGATA AGAGTGTAAC 2100 

ATCCAGCTCT ATGTGGGAAA AAAGAAATCC TGGTTTGTAA TGTTTGT CAG TAAATACTCC 2160 

CACTATGCCT GATGTGACGC TACTAACCTG ACATCACCAA GTGTGGAATT GGAGAAAAGC 2220 

ACAATCAACT TTTCTGAGCT GGTGTAAGCC AGT T C CAG CA CACCATTGAT GAATTCAAAC 2280 

AAATGGCTGT AAAACTAAAC ATACATGTTG GGCATGATTC TACCCTTATT CSCCCCAAGA 2340 

GACCTAGCTA AGGTCTATAA ACATGAAGGG AAAATTAGCT TTTAGTTTTA AAACTCTTTA 2400 

TCCCATCTTG ATTGGGGCAG TTGACTTTTT TTTTTTCCCA GAGTGCCGTA GTCCTTTTTG 2460 

TAACTACCCT CTCAAATGGA CAATACCAGA AGTGAATTAT CCCTGCTGGC TTTCTTTTCT 2520 

CTATGAAAAG CAACTGAGTA CAATTGTTAT GATCTACTCA TTTGCTGACA CATCAGTTAT 2580 

ATCTTGTGGC ATAT CCATTG TGGAAACTGG ATGAACAGGA TGTATAATAT G CAATCTT AC 2 640 

TTCTATATCA TTAGGAAAAC ATCTTAGTTG ATGCTACAAA ACACCTTGTC AACCTCTTCC 2700 

TGTCTTACCA AACAGTGGGA GGGAATTCCT AGCTGTAAAT ATAAATTTTG CCCTTCCATT 2760 

T CTACTGT AT AAACAAATTA GCAATCATTT TATATAAAGA AAATCAATGA AGGATTTCTT 2820 

ATTTTCTTGG AATTTTGTAA AAAGAAATTG TGAAAAATGA GCTTGTAAAT ACTCCATTAT 2880 

TTTATTTTAT AGTCTCAAAT CAAATACATA CAACCTATGT AATTTTTAAA G CAAAT AT AT 2 940 

AATGCAACAA TGTGTGTATG TTAATATCTG ATACTGTATC TGGGCTGATT TTTTAAATAA 3000 
AATAGAGTCT GGAATGCT 

Seq ID NO: 337 Protein sequence
Protein Accession #: NP_005786.1 

1 11 21 31 41 51 

I I I I 1 I 

MEKKCTLYFL VLLPFFMILV TAELEESPED SIQLGVTRNK IMTAQYECYQ KIMQDPIQQA 60 

EGVYCNRTWD GWLCWNDVAA GTESMQLCPD YFQDFDPSEK VTKICDQDGN WFRHPASNRT 12 0 

WTNYTQCNVN THEKVKTALN LFYLTIIGHG LSIASLLISL GIFFYFKSLS CQRITLHKNL 180

FFSFVCNSW T I I HLTAVAN NQALVATNPV SCKVSQFIHL YLMGCNYFWM LCEGIYLHTL 240 

IWAVFAEKQ HLMWYYFLGW GFPLIPACIH AIARSLYYND NCWISSDTHL LYIIHGPICA 300 

ALLVNLFFLL NIVRVLITKL KVTHQAESNL YMKAVRATL I LVPLLGIEFV LIPWRPEGKI 360 

AEEVYDYIMH ILMHFQGLLV STIFCFFNGE VQAILRRNWN QYKIQFGNSF SNSEALRSAS 42 0 
YTVSTISDGP GYSHDCPSEH LNGKSIHDIE NVLLKPENLY N 

Seq ID NO: 338 DNA sequence
Nucleic Acid Accession #: NM_001795 
Coding sequence: 25-2379

1 11 21 31 41 51 

I 1 I I I I 

GCACGAT CTG TTCCTCCTGG GAAGATGCAG AGGCTCATGA TGCTCCTCGC CACATCGGGC 60 

GCCTGCCTGG GCCTGCTGGC AGTGGCAG CA GTGG CAG CAG CAGGTGCTAA CCCTGCCCAA 120 

CGGGACACCC ACAGCCTGCT GCCCACCCAC CGGCGCCAAA AGAGAGATTG GATTTGGAAC 180 

CAGATGCACA TTGATGAAGA GAAAAACACC TCACTTCCCC ATCATGTAGG CAAGATCAAG 240 

TCAAGCGTGA GTCGCAAGAA TGCCAAGTAC CTGCTCAAAG GAGAATATGT GGGCAAGGTC 3 00 

TTCCGGGTCG ATGCAGAGAC AGGAGACGTG TTCGCCATTG AGAGGCTGGA CCGGGAGAAT 3 60 

AT CT CAG AGT ACCACCTCAC TGCTGTCATT GTGGACAAGG ACACTGGTGA AAACCTGGAG 420 

ACTCCTTCCA GCTTCACCAT CAAAGTTCAT GACGTGAACG ACAACTGGCC TGTGTTCACG 480 

CATCGGTTGT TCAATGCGTC CGTGCCTGAG TCGTCGGCTG TGGGGACCTC AGTCATCTCT 540 

GTGACAGCAG TGGATGCAGA CGACCCCACT GTGGGAGACC ACGCCTCTGT CATGTACCAA 600 

ATCCTGAAGG GGAAAGAGTA TTTTGCCATC GATAATTCTG GACGTATTAT CACAATAACG 660 

AAAAGCTTGG ACCGAGAGAA GCAGGCCAGG TATGAGATCG TGGTGGAAGC GCGAGATGCC 720 

CAGGGCCTCC GGGGGGACTC GGGCACGGCC ACCGTGCTGG TCACTCTGCA AGACAT CAAT 780 

GACAACTTCC CCTTCTTCAC CCAGACCAAG TACACATTTG TCGTGCCTGA AGACACCCGT 840 

GTGGGCACCT CTGTGGGCTC TCTGTTTGTT GAGGACCCAG ATGAGCCCCA GAACCGGATG 900 

ACCAAGTACA GCATCTTGCG GG G CG AC T AC CAGGACGCTT TCACCATTGA GACAAACCCC 960 

GCCCACAACG AGGGCATCAT CAAGCCCATG AAGCCTCTGG ATTATGAATA CATCCAGCAA 1020 

TACAGCTTCA TCGTCGAGGC CACAGACCCC ACCATCGACC TCCGATACAT GAGCCCTCCC 1080 

GCGGGAAACA GAG CCCAGGT CATTATCAAC ATCACAGATG TGGACGAGCC CCCCATTTTC 1140 

CAGCAGCCTT TCTACCACTT CCAGCTGAAG GAAAACCAGA AGAAGCCTCT GATTGGCACA 12 00 

GTGCTGGCCA TGGACCCTGA TGCGGCTAGG CATAGCATTG GATACTCCAT CCGCAGGACC 12 60 

AGTGACAAGG GCCAGTTCTT CCGAGTCACA AAAAAGGGGG ACATTTACAA TGAGAAAGAA 132 0 

CTGGACAGAG AAGTCTACCC CTGGTATAAC CTGACTGTGG AGGCCAAAGA ACTGGATTCC 13 80 

ACTGGAACCC CCACAGGAAA AGAATCCATT GTGCAAGTCC ACATTGAAGT TTTGGATGAG 1440 

AATGACAATG CCCCGGAGTT TGCCAAGCCC TACCAGCCCA AAGTGTGTGA GAACGCTGTC 1500 

CATGGCCAGC TGGTCCTGCA GATCTCCGCA ATAGACAAGG ACATAACACC ACGAAACGTG 1560 

AAGTT CAAAT TCACCTTGAA TACTGAGAAC AACTTTACCC TCACGGATAA TCACGATAAC 162 0 

ACGGCCAACA TCACAGTCAA GTATGGGCAG TTTGACCGGG AGCATACCAA GGTCCACTTC 1680 

CTACCCGTGG TCATCTCAGA CAATGGGATG CCAAGTCGCA CGGGCACCAG CACGCTGACC 1740 

GTGGCCGTGT GCAAGTGCAA CGAGCAGGGC GAGTTCACCT TCTGCGAGGA TATGGCCGCC 1800 

CAGGTGGGCG TGAG CAT CCA GGCAGTGGTA GCCATCTTAC TCTGCATCCT CACCATCACA 1860 

GTGATCACCC TGCTCATCTT CCTGCGGCGG CGGCTCCGGA AGCAGGCCCG CGCGCACGGC 192 0 

AAGAGCGTGC CGGAGATCCA CGAGCAGCTG GTCACCTACG ACGAGGAGGG CGG CGGCG AG 1980 

ATGGACACCA CCAGCTACGA TGTGTCGGTG CTCAACTCGG TGCGCCGCGG CGGGGCCAAG 2 040 

CCCCCGCGGC CCGCGCTGGA CGCCCGGCCT TCCCTCTATG CGCAGGTGCA GAAGCCACCG 2100 

AGGCACGCGC CTGGGG CACA CGGAGGGCCC GGGGAGATGG CAGCCATGAT CGAGGTGAAG 2160" 

AAGGACGAGG CGGACCACGA CGGCGACGGC CCCCCCTACG ACACGCTGCA CAT CTACGGC 222 0 

TACGAGGGCT CCGAGTCCAT AGCCGAGTCC CTCAGCTCCC TGGG CACCGA CTCATCCGAC 22 80 
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TCTGACGTGG ATTACGACTT 
CTGTACGGCT CGGACCCCCG 
CTGGGGACCC AAACCCCCTG 
AAATGGCAGT GACTCCCCAG 
CCTTGGGATA GCAAACTCCA 
TTCTCAAATG CTGGCAAATC 
CTGTCACCCA CAGACCGCCG 
GCAAAACAGA CTGTGTTTAA 
TAAGGCTGGT GAGGTCCTGG 
TGTGGGGCAG GATTCTCTGC 
GGGAGCCCTA GCCCTGCTCC 
CCCTCTCCAG GCCTGTCAAG 
CTGAAGTGAC CTCACTGGCC 
ATTCAGGGAA ATGCTTATTA 
GAGATCAGGA GTGACAGATC 
AGGCCTGGAA GAGCTGAGAC 
AGAAGGGGCA GATGTTCCCG 
GCCAATCCAT GCTCTCTTTC 
CAAGATGTGG CCTTTAGCAA 
GCCGAGCATG TGTCTTTACA 
CACCTTGCAG AAGGAAGGCC 
ACTGGAACGT TTCACTGCAA 
AGGGAAGGAG ACACCAAGCT 
CCCTCACACT GCAAGGGATT 
TTCTTATAAT GATTTTTTTA 
GAATAAGGGT TTTTGCATAA 
TTTTTAGTTG GAAAAACAAT 
TACAGATAAT GT CT AT AT AT 
CCTAAATAAA GAAAAATCTT 



PCT/US02/12476 



CCTTAACGAC 
GGAGGAGCTG 
CAGCCCAGGC 
CCCAGCACCC 
GGTTCCTGAA 
CAGGCTGGTG 
TCTAACTCAA 
CTGCTGCAGG 
TGCCTATCTG 
AGCCCATTCC 
AACTCCATAC 
AGGGAGGAAG 
TGCCATGCCA 
AACCTTGAAG 
ACAGGGTGAG 
CTTGCTTTGA 
GAGATCAGAA 
TTTTCTGTGT 
AACTGACAAT 
CCTCGCTGTT 
CTGCCCTGCC 
ACACACCTTG 
CACCCTTCGT 
GTAGATAACA 
CTAATGATAC 
TAAGCAGGTT 
TCCTGTAACC 
TGGCCAAACT 
TAGCCTGGGC 



TGGGGACCCA 
CTGTATTAGG 
CAGTCAGACT 
CTTCCTCGTG 
ATATCCAGGA 
TTCTGTCTGG 
AGACTTCCTC 
GTCTTTTTCT 
CCTGGAGGCA 
CAAGGGAGAC 
TCCACTCCAA 
GGGCCCCATG 
GTAACTGTGC 
CAACTGTGAA 
GGCCACCTCC 
GACTCCTCAG 
GACGTCTCCC 
CTACTCCTTA 
GTCCAAACCC 
GTCACATCTC 
CAACCTCTGT 
GAGAAGTGGC 
CATGGACCGA 
CTGACTTGTT 
TTACAAGTTT 
GTTATTTAGG 
TTCTATTTTC 
GGTGCATGAC 
AACAAAAAAA 



GGTTTAAGAT 
CGGCCGAGGT 
CCAGGCACCA 
GGTCCCAGAG 
AT ATATGT CA 
GCTCAGACAT 
TGGCTCCCCA 
AGGGTCCCTG 
AAGGCCTGGA 
TGACCATCAT 
GTGCCCCACC 
GCAGCTCCTG 
TGTACTGAGC 
TTCATTCTGG 
ACACCCACCC 
CACCCCTCCA 
CTTCTCTGCC 
TCCCTTGGTT 
ACTCATGACT 
AGGGAACTGA 
GGTCACCCAT 
ATCAGTCAAC 
GGTTCCCACT 
TGTTTTAACC 
CTAGCTCTCA 
TTAACAATAT 
TATAATTGTA 
AAGTACTGTA 



GCTGGCTGAG 2340 

CACTCTGGGC 2400 

CAGCCTCCAA 2460 

ACCTCATCAG 2 520 

GTG ATGACTA 2580 

CCACAT AACC 2640 

AGGCTGCAAA 2700 

AACGCCCTGG 2760 

CAGCTTGACT 2 82 0 

GCCCTCTCTC 2 880 

ACTCCCCAAC 2 940 

ACCTTGGGTC 3000 

ACTGAACCAC 3060 

AGGGGCAGTG 3120 

CCTCTGGAGA 3180 

GTTTTGCCTG 3240 

TCACCTGGTC 33 00 

TAGAGGAACC 3360 

GCATGACGGA 3420 

CCCTCAGGCA 3480 

GCATCATTCC 3540 

AGAGAGGGGC 3600 

CTGGCAAAGC 3660 

AATAACTAGC 3 72 0 

CAGACATATA 3 780 

TAATTCAGGT 3840 

GTAATTGCTC 3 900 

TTTTTTTATA 3 960 



Seq ID NO: 339 Protein sequence
Protein Accession #: NP_001786
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MQRLMMLLAT 
NT S L PHHVGK 
VIVDKDTGEN 
PTVGDHASVM 
TATVLVTLQD 
DYQDAFTIET 
INITDVDEPP 
VTKKGDIYNE 
KPYQPKVCEN 
GQFDREHTKV 
WAILLCILT 
SVLNSVRRGG 
DGPPYDTLHI 
ELLY 



11 
I 

SGACLGLLAV 
IKSSVSRKNA 
LETPSSFTIK 
YQILKGKEYF 
INDNFPFFTQ 
NPAHNEGI IK 
IFQQPFYHFQ 
KELDREVYPW 
AVHGQLVLQI 
HFLPWI SDN 
ITVITLLIFL 
AKPPRPALDA 
YGYEGSESIA 



21 
I 

AAVAAAGANP 
KYLLKGEYVG 
VHDVNDNWPV 
AIDNSGRIIT 
TKYTFWPED 
PMKPIjD YE Y I 
LKENQKKPLI 
YNLTVEAKEL 
SAIDKDITPR 
GMPSRTGTST 
RRRLRKQARA 
RPSLYAQVQK 
ESLSSLGTDS 



31 



AQRDTHSLLP 
KVFRVDAETG 
FTHRLFNASV 
ITKSLDREKQ 
TRVGTSVGSL 
QQYSFIVEAT 
GT VL AMD PD A 
DSTGTPTGKE 
NVKFKFTLNT 
LTVAVCKCNE 
HGKSVPEIHE 
PPRHAPGAHG 
SDSDVDYDFL 



41 
1 

THRRQKRDWI 
DVFAIERLDR 
PESSAVGTSV 
AR YE I WEAR 
FVEDPDEPQN 
DPTIDLRYMS 
ARHSIGYSIR 
SIVQVHIEVIi 
ENNFTLTDNH 
QGEFTFCEDM 
QLVTYDEEGG 
GPGEMAAMIE 
NDWGPRFKML 



51 
] 

WNQMHIDEEK 60 

ENISEYHLTA 120 

I SVTAVDADD 180 

DAQGLRGDSG 240 

RMTKYSILRG 300 

PPAGNRAQVI 3 60 

RTSDKGQFFR 420 

DENDNAPEFA 480 

DNTANITVKY 540 

AAQVGVSIQA 600 

GEMDTTSYDV 660 

VKKDEADHDG 720 

AELYGSDPRE 780 



55 



Seq ID NO: 340 DNA sequence 
Nucleic Acid Accession #: NM_003088 
Coding sequence: 112-1593 
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GCGGAGGGTG 
CCCGCCACCC 
AACGG C ACAG 
CTGACGGCCG 
CAGATCTGGA 
AGCCACCTGG 
GTGCCCGGTC 
CAGTCCGAGG 
CAGACGGTGT 
ATCTACAGTG 
GCCGTGGACC 
CAGCGCTACA 
GCGCGCCCCG 
CGCGACTGCG 
AAGGCCACCA 
GTGCTGCAGG 
AATCAGGACG 
AAGTGTGCCT 
CAGTCCACCG 
CGCATCACAC 
GCCGCCTCGG 
CCCATCATCG 
CTGGACGCCA 
AACATCAAAG 
AGCGGCGACA 
AAGGTGGGCG 
ACCGTGGACC 
CCACATGGCG 
GGCGGGAGGC 
CCTGTCGCCC 



11 
I 

CGTGCGGGCC 
ACCTCCCGGG 
CCGAGGCGGT 
AGGCGTTCGG 
CGCTGGAGCA 
GCCGCTACCT 
CCGACTGCCG 
CGCACCGGCG 
CCCCCGCCGA 
TCACCCGTAA 
GCGACGTGCC 
GCGTGCAGAC 
AGCCGGCCAC 
AGGGCCGTTA 
AGGTGGGCAA 
CGGCCAACGA 
AGGAGACCGA 
TCCGTACCCA 
CCTCCAGCAA 
TGAGGGCGTC 
TGGAGACAGC 
TGTTCCGCGG 
ACCGCTCCAG 
ACTCCACAGG 
CTCCTGTGGA 
GGCGCTACCT 
CCGCCTCGCT 
GCTCCTGCCA 
AAGCCCCCTT 
CTATGGACTC 



21 
I 

GCGGCAGCCG 
GCCGCGCAGC 
GCAGATCCAG 
GTTCAAGGTG 
GCCCCCTGAC 
GGCGGCGGAC 
TTTCCTCATC 
CTACTTCGGC 
GAAGTGGAGC 
GCGCTACGCG 
CTGGGGCGTC 
CGCCGACCAC 
TGGCTACACG 
CCTGGCGCCG 
GGACGAGCTC 
GAGGAACGTG 
CCAGGAGACC 
CACGGGCAAG 
GAATGCCAGC 
CAATGG CAAG 
AGGGGACTCA 
GGAGCATGGC 
CTATGACGTC 
CAAATACTGG 
CTTCTTCTTC 
GAAGGGCGAC 
CTGGGAGTAC 
ACCCTCCCTG 
GCCTTTCAAA 
CCCACTCTCC 



31 
I 

AACAAAGGAG 
GGCCTCTCGT 
TTCGGCCTCA 
AACGCGTCCG 
GAGGCGGGCA 
AAGGACGGCA 
GTGGCGCACG 
GGCACCGAGG 
GTGCACATCG 
CACCTGAGCG 
GACTCGCTCA 
CGCTTCCTGC 
CTGGAGTTCC 
TCGGGGCCCA 
TTTGCTCTGG 
TCCACGCGCC 
TTCCAGCTGG 
TACTGGACGC 
TGCTACTTTG 
TTTGTGACCT 
GAGCTCTTCC 
TTCATCGGCT 
TTCCAGCTGG 
ACGGTGGGCA 
GAGTTCTGCG 
CACGCAGGCG 
TAGGGCCGGC 
CTAACCCCTT 
CTGGAAACCC 
CCTCCGCCCG 



41 

I 

CAGGGGCGCC 
CTACTGCCAC 
TCAACTGCGG 
CCAGCAGCCT 
GCGCGGCCGT 
ACGTGACCTG 
ACGACGGTCG 
ACCGCCTGTC 
CCATGCACCC 
CGCGGCCGGC 
TCACCCTCGC 
GCCACGACGG 
GCTCCGGCAA 
GCGGCACGCT 
AGCAGAGCTG 
AGGGTATGGA 
AGAT CGACCG 
TGACGGCCAC 
ACATCGAGTG 
CCAAGAAGAA 
TCATGAAGCT 
GCCGCAAGGT 
AGTTCAACGA 
GTGACTCCGC 
ACTATAACAA 
TCCTGAAGGC 
CCGTCCTTCC 
CTCCGCCAGG 
CAGAGAAAAC 
GGTTCCCTAC 



51 
I 

GCCGCAGGGA 60 

CATGACCGCC 12 0 

CAACAAGTAC 180 

GAAGAAGAAG 2 40 

GTGCCTGCGC 3 00 

CGAGCGCGAG 3 60 

CTGGTCGCTG 420 

CTGCTTCGCG 4 8 0 

TCAGGTCAAC 540 

CGACGAGATC 600 

CTTCCAGGAC 660 

GCGCCTGGTG 720 

GGTGGCCTTC 7 80 

CAAGGCGGGC 840 

CGCCCAGGTC 900 

CCTGTCTGCC 960 

CGACACCAAA 102 0 

CGGGGGCGTG 1080 

GCGTGACCGG 1140 

TGGGCAGCTG 1200 

CATCAACCGC 1260 

CACGGGCACC 1320 

TGGCGCCTAC 13 80 

GGTCACCAGC 1440 

GGTGGCCATC 1500 

CTCGGCGGAA 1560 

CCGCCCCTGC 1620 

TGGGCTCCAG 1680 

GGTGCCCCCA 1740 

TCCCCTCGGG 1800 



314 



WO 02/086443 

TCAGCGGCTG CGGCCTGGCC CTGGGAGGGA TTTCAGATGC CCCTGCCCTC TTGTCTGCCA 1860 

CGGGGCGAGT CTGGCACCTC TTTCTTCTGA CCTCAGACGG CTCTGAGCCT TATTTCTCTG 192 0 

GAAGCGGCTA AGGGACGGTT GGGGGCTGGG AGCCCTGGGC GTGTAGTGTA ACTGGAATCT 1980 

TTTGCCTCTC CCAGCCACCT CCTCCCAGCC CCCCAGGAGA GCTGGGCACA TGT CCCAAGC 2040 

CTGTCAGTGG CCCTCCCTGG TGCACTGTCC CCGAAACCCC TGCTTGGGAA GGGAAGCTGT 2100 

CGGGAGGGCT AGGACTGACC CTTGTGGTGT TTTTTTGGGT GGTGGCTGGA AACAGCCCCT 2160 

CTCCCACGTG GGAGAGGCTC AGCCTGGCTC CCTTCCCTGG AGCGGCAGGG CGTGACGGCC 222 0 

ACAGGGTCTG CCCGCTGCAC GTTCTGCCAA GGTGGTGGTG GCGGGCGGGT AGGGGTGTGG 2280 

GGGCCGTCTT CCTCCTGTCT CTTTCCTTTC ACCCTAGCCT GACTGGAAGC AGAAAATGAC 2 340 

CAAATCAGTA TTTTTTTTAA TGAAATATTA TTGCTGGAGG CGTCCCAGGC AAGCCTGGCT 240 0 

GTAGTAGCGA GTGATCTGGC GGGGGGCGTC TCAGCACCCT CCCCAGGGGG TGCATCTCAG 2460 

CCCCCTCTTT CCGTCCTTCC CGTCCAGCCC CAGCCCTGGG CCTGGGCTGC CGACACCTGG 2 52 0 

GCCAGAGCCC CTGCTGTGAT TGGTGCTCCC TGGGCCTCCC GGGTGGATGA AGCCAGGCGT 2 5 80 

CGCCCCCTCC GGGAGCCCTG GGGTGAGCCG CCGGGGCCCC CCTGCTGCCA GCCTCCCCCG 2 640 

TCCCCAACAT GCATCTCACT CTGGGTGTCT TGGTCTTTTA TTTTTTGTAA GTGTCATTTG 270 0 

TATAACTCTA AACGCCCATG ATAGTAGCTT CAAACTGGAA ATAGCGAAAT AAAATAACTC 2 760 
AGTCTGC 

Seq ID NO: 341 Protein sequence 
Protein Accession #: NP_003079 

1 11 21 31 41 51 

| | | | | |

MTANGTAEAV QIQFGLINCG NKYLTAEAFG FKVNASASSL KKKQIWTLEQ PPDEAGSAAV 60 

CLRSHLGRYL AADKDGNVTC EREVPGPDCR FL I VAHDDGR WSLQSEAHRR YFGGTEDRLS 120 

CFAQTVSPAE KWSVHIAMHP QVNIYSVTRK RYAHLSARPA DEIAVDRDVP WGVDSLITLA 180 

FQDQRYSVQT ADHRFLRHDG RL VARPE PAT GYTLEFRSGK VAFRDCEGRY LAPSGPSGTL 240 

KAGKATKVGK DELFALEQSC AQWLQAANE RNVSTRQGMD LSANQDEETD QETFQLEIDR 300 

DTKKCAFRTH TGKYWTLTAT GGVQSTASSK NASCYFDIEW RDRRITLRAS NGKFVTSKKN 360 

GQLAASVETA GDSELFLMKL INRPIIVFRG EHGFIGCRKV TGTLDANRSS YDVFQLEFND 420 

GAYNIKDSTG KYWTVGSDSA VTSSGDTPVD FFFEFCDYNK VAIKVGGRYL KGDHAGVLKA 480 
SAETVDPASL WEY 



Seq ID NO: 342 DNA sequence 

Nucleic Acid Accession #: FGENESH predicted 
Coding sequence: 660-1705

1 11 21 31 41 51 

| | | | | |

CGCTCCGCAC ACATTTCCTG TCGCGGCCTA AGGGAAACTG TTGGCCGCTG GGCCCGCGGG 60 

GGGATTCTTG GCAGTTGGGG GGTCCGTCGG GAGCGAGGGC GGAGGGGAAG GGAGGGGGAA 120 

CCGGGTTGGG GAAGCCAGCT GTAGAGGGCG GTGACCGCGC TCCAGACACA GCTCTGCGTC 180 

CTCGAGCGGG ACAGATCCAA GTTGGGAGCA GCTCTGCGTG CGGGGCCTCA GAGAATGAGG 240 

CCGGCGTTCG CCCTGTGCCT CCTCTGGCAG GCGCTCTGGC CCGGGCCGGG CGGCGGCGAA 3 00 

CACCCCACTG CCGACCGTGC TGGCTGCTCG GCCTCGGGGG CCTGCTACAG CCTGCACCAC 3 60 

GCTACCATGA AGCGGCAGGC GGCCGAGGAG GCCTGCATCC TGCGAGGTGG GGCGCTCAGC 420 

ACCGTGCGTG CGGGCGCCGA GCTGCGCGCT GTGCTCGCGC TCCTGCGGGC AGGCCCAGGG 480 

CCCGGAGGGG GCTCCAAAGA CCTGCTGTTC TGGGTCGCAC TGGAGCGCAG GCGTTCCCAC 540 

TGCACCCTGG AGAACGAGCC TTTGCGGGGT TTCTCCTGGC TGTCCTCCGA CCCCGGCGGT 600 

CTCGAAAGCG ACACGCTGCA GTGG GTGG AG GAGCCCCAAC GCTCCTGCAC CGCGCGGAGA 660 

TGCGCGGTAC TCCAGGCCAC CGGTGGGGTC GAGCCCGCAG CTGGAAGGAG ATGCGATGCC 720 

ACCTGCGCGC CAACGGCTAC CTGTGCAAGT ACCAGTTTGA GGTCTTGTGT CCTGCGCCGC 780 

GCCCCGGGGC CGCCTCTAAC TTGAGCTATC GCGCGCCCTT CCAGCTGCAC AGCGCCGCTC 840 

TGGACTTCAG TCCACCTGGG ACCGAGGTGA GTGCGCTCTG CCGGGGACAG CTCCCGATCT 900 

CAGTTACTTG CATCGCGGAC GAAATCGGCG CTCGCTGGGA CAAACTCTCG GGCGATGTGT 960 

TGTGTCCCTG CCCCGGGAGG TACCTCCGTG CTGGCAAATG CGCAGAGCTC CCTAACTGCC 1020 

TAGACGACTT GGGAGGCTTT GCCTGCGAAT GTGCTACGGG CTTCGAGCTG GGGAAGGACG 1080 

GCCGCTCTTG TGTGACCAGT GGGGAAGGAC AGCCGACCCT TGGGGGGACC GGGGTGCCCA 1140 

CCAGGCGCCC GCCGGCCACT GCAACCAGCC CCGTGCCGCA GAGAACATGG CCAATCAGGG 1200 

TCGACGAGAA GCTGGGAGAG ACACCACTTG TCCCTGAACA AGACAATTCA GTAACATCTA 1260 

TTCCTGAGAT TCCTCGATGG GG AT CAGAG A GCACGATGTC TACCCTTCAA ATGTCCCTTC 1320 

AAGCCGAGTC AAAGGCCACT ATCACCCCAT CAGGGAGCGT GATTT CCAAG TTTAATTCTA 13 80 

CGACTTCCTC TGCCACTCCT CAGGCTTTCG ACTCCTCCTC TGCCGTGGTC TTCATATTTG 1440 

TGAGCACAGC AGTAGTAGTG TTGGTGATCT TGACCATGAC AGTACTGGGG CTTGTCAAGC 1500 

TCTGCTTTCA CGAAAGCCCC TCTTCCCAGC CAAGGAAGGA GTCTATGGGC CCGCCGGGCC 1560 

TGGAGAGTGA TCCTGAGCCC GCTGCTTTGG GCTCCAGTTC TGCACATTGC ACAAACAATG 1620 

GGGTGAAAGT CGGGGACTGT GATCTGCGGG ACAGAGCAGA GGGTGCCTTG CTGGCGGAGT 1680 
CCCCTCTTGG CTCTAGTGAT G CAT AG 

Seq ID NO: 343 Protein sequence 
Protein Accession #: FGENESH predicted 

1 11 21 31 41 51 

| | | | | |

MGKDFMTKTP KAFATKAKID KWDLIKLKSF CTAKETI IRV NSQPTDWQKT FAIYPSDKGV 60 

IARIYKELEQ IYKKKKPTKT LRTHFLSRPK GNCWPLGPRG DSWQLGGPSG ARAEGKGGGT 12 0 

GLGKPAVEGG DRAPDTAIiRP RAGQIQVGSS SACGASENEA GVRPVPPLAG ALARAGRRRT 180 

PHCRPCWLLG LGGLLQPAPR YHEAAGGRGG LHPARWGAQH RACGRRAARC ARAPAGRPRA 240 

RRGLQRPAVL GRTGAQ AF P L HPGERAFAGF LLAVLRPRRS RKRHAAVGGG APTLLHRAEM 300 

RGT PGHRWGR ARSWKEMRCH LRANGYLCKY QFEVLCPAPR PGAASNLSYR APFQLHSAAL 360 

DFSPPGTEVS ALCRGQLPIS VTCIADEIGA RWDKLSGDVL CPCPGRYLRA GKCAELPNCL 420 

DDLGGFACEC ATGFELGKDG RSCVTSGEGQ PTLGGTGVPT RRPPATATSP VPQRTWPIRV 480 

DEKLGETPLV PEQDNSVTSI PEIPRWGSQS TMSTLQMSLQ AESKATITPS GSVISKFNST 540 

TSSATPQAFD SSSAWFIFV STAWVLVIL TMTVLGLVKL CFHESPSSQP RKESMGPPGL 600 
ESDPEPAALG SSSAHCTNNG VKVGDCDLRD RAEGALLAES PLGSSDA 



315 



WO 02/086443 



Seq ID NO: 344 DNA sequence 
Nucleic Acid Accession #: NM_012072 
Coding sequence: 149-2107 

1 11 21 31 41 51

AAAGCCCTCA GCCTTTGTGT CCTTCTCTGC GCCGGAGTGG CTGCAGCTCA CCCGTCAGCT 60 
CCCCTTGGGG CCCAGCTGGG AGCCGAGATA GAAGCTCCTG TCGCCGCTGG GCTTCTCGCC 120 
TCCCGCAGAG GGCCACACAG AGACCGGGAT GGCCACCTCC ATGGGCCTGC TGCTGCTGCT 180 
GCTGCTGCTC CTGACCCAGC CCGGGGCGGG GACGGGAGCT GACACGGAGG CGGTGGTCTG 240 
CGTGGGGACC GCCTGCTACA CGGCCCACTC GGGCAAGCTG AGCGCTGCCG AGGCCCAGAA 300 
CCACTGCAAC CAGAACGGGG GCAACCTGGC CACTGTGAAG AGCAAGGAGG AGGCCCAGCA 360 
CGTCCAGCGA GTACTGGCCC AGCTCCTGAG GCGGGAGGCA GCCCTGACGG CGAGGATGAG 420 
CAAGTTCTGG ATTGGGCTCC AGCGAGAGAA GGGCAAGTGC CTGGACCCTA GTCTGCCGCT 480 
GAAGGGCTTC AGCTGGGTGG GCGGGGGGGA GGACACGCCT TACTCTAACT GGCACAAGGA 540 
GCTCCGGAAC TCGTGCATCT CCAAGCGCTG TGTGTCTCTG CTGCTGGACC TGTCCCAGCC 600 
GCTCCTTCCC AACCGCCTGC CCAAGTGGTC TGAGGGCCCC TGTGGGAGCC CAGGCTCCCC 660 
CGGAAGTAAC ATTGAGGGCT TCGTGTGCAA GTTCAGCTTC AAAGGCATGT GCCGGCCTCT 720 
GGCCCTGGGG GGCCCAGGTC AGGTGACCTA CACCACCCCC TTCCAGACCA CCAGTTCCTC 780 
CTTGGAGGCT GTGCCCTTTG CCTCTGCGGC CAATGTAGCC TGTGGGGAAG GTGACAAGGA 840 
CGAGACTCAG AGTCATTATT TCCTGTGCAA GGAGAAGGCC CCCGATGTGT TCGACTGGGG 900 
CAGCTCGGGC CCCCTCTGTG TCAGCGCCAA GTATGGCTGC AACTTCAACA ATGGGGGCTG 960 
CCACCAGGAC TGCTTTGAAG GGGGGGATGG CTCCTTCCTC TGCGGCTGCC GACCAGGATT 1020 
CCGGCTGCTG GATGACCTGG TGACCTGTGC CTCTCGAAAC CCTTGCAGCT CCAGCCCATG 1080 
TCGTGGGGGG GCCACGTGCG TCCTGGGACC CCATGGGAAA AACTACACGT GCCGCTGCCC 1140 
CCAAGGGTAC CAGCTGGACT CGAGT CAGCT GGACTGTGTG GACGTGGATG AATGCCAGGA 1200 
CTCCCCCTGT GCCCAGGAGT GTGTCAACAC CCCTGGGGGC TTGCGCTGCG AATGCTGGGT 1260 
TGGCTATGAG CCGGGCGGTC CTGGAGAGGG GGCCTGTCAG GATGTGGATG AGTGTGCTCT 1320 
GGGTCGCTCG CCTTGCGCCC AGGGCTGCAC CAACACAGAT GGCTCATTTC ACTGCTCCTG 1380 
TGAGGAGGGC TACGTCCTGG CCGGGGAGGA CGGGACTCAG TGCCAGGACG TGGATGAGTG 144 0 
TGTGGGCCCG GGGGGCCCCC TCTGCGACAG CTTGTGCTTC AACACACAAG GGTCCTTCCA 1500 
CTGTGGCTGC CTGCCAGGCT GGGTGCTGGC CCCAAATGGG GTCTCTTGCA CCATGGGGCC 1560 
TGTGTCTCTG GGACCAC CAT CTGGGCCCCC CGATGAGGAG GACAAAGGAG AGAAAGAAGG 1620 
GAGCACCGTG CCCCGCGCTG CAACAGCCAG TCCCACAAGG GGCCCCGAGG GCACCCCCAA 1680 
GGCTACACCC AC C AC AAGT A GACCTTCGCT GTCATCTGAC GCCCCCATCA CATCTGCCCC 17 40 
ACTCAAGATG CTGGCCCCCA GTGGGTCCTC AGGCGT CTGG AGGGAGCCCA GCATCCATCA 180 0 
CGCCACAGCT GCCTCTGGCC CCCAGGAGCC TGCAGGTGGG GACTCCTCCG TGGCCACACA 1860 
AAACAACGAT GGCACTGACG GGCAAAAGCT GCTTTTATTC TACATCCTAG GCACCGTGGT 192 0 
GGCCATCCTA CTCCTGCTGG CCCTGGCTCT GGGGCTACTG GTCTATCGCA AGCGGAGAGC 1980 
G AAGAGG GAG GAGAAGAAGG AGAAGAAGCC CCAGAATGCG GCAGACAGTT ACTCCTGGGT 2 040 
TCCAGAGCGA GCTGAGAGCA GGGCCATGGA GAACCAGTAC AGTCCGACAC CTGGGACAGA 210 0 
CTGCTGAAAG TGAGGTGGCC CTAGAGACAC TAGAGTCACC AGCCACCATC CTCAGAGCTT 2160 
TGAACTCCCC ATTCCAAAGG GGCACCCACA TTTTTTTGAA AGACTGGACT GGAATCTTAG 222 0 
CAAACAATTG TAAGTCTCCT CCTTAAAGGC CCCTTGGAAC ATGCAGGTAT TTTCTACGGG 2280 
TGTTTGATGT TCCTGAAGTG GAAGCTGTGT GTTGGCGTGC CACGGTGGGG ATTTCGTGAC 2340 
TCTATAATGA TTGTTACTCC CCCTCCCTTT TCAAATTCCA ATGTGACCAA TTCCGGATCA 240 0 
GGGTGTGAGG AGGCTGGGGC TAAGGGGCTC CCCTGAATAT CTTCTCTGCT CACTTCCACC 2460 
ATCTAAGAGG AAAAGGTGAG TTGCTCATGC TGATTAGGAT TGAAATGATT TGTTTCTCTT 2520 
CCTAGGATGA AAACTAAATC AATTAATTAT TCAATTAGGT AAGAAGATCT GGTTTTTTGG 2580 
TCAAAGGGAA CATGTTCGGA CTGGAAACAT TTCTTTACAT TTGCATTCCT CCATTTCGCC 2640 
AGCACAAGTC TTGCTAAATG TGATACTGTT GACATCCTCC AGAATGGCCA GAAGTGCAAT 2700 
TAACCTCTTA GGTGGCAAGG AGGCAGGAAG TGCCTCTTTA GTTCTTACAT TTCTAATAGC 2760 
CTTGGGTTTA TTTGCAAAGG AAG CTTG AAA AATATGAGAA AAGTTGCTTG AAGTGCATTA 2820 
CAGGTGTTTG TGAAGTCACA TAATCTACGG GGCTAGGGCG AGAGAGGCCA GGGATTTGTT 2880 
CACAGATACT TGAATTAATT CATCCAAATG TACTGAGGTT ACCACACACT TGACTACGGA 2 940 
TGTGATCAAC ACTAACAAGG AAACAAATTC AAGGACAACC TGTCTTTGAG CCAGGGCAGG 3000 
CCTCAGACAC CCTGCCTGTG GCCCCGCCTC CACTTCATCC TGCCCGGAAT GCCAGTGCTC 3060 
CGAGCTCAGA CAGAGGAAGC CCTGCAGAAA GTTCCATCAG GCTGTTTCCT AAAGGATGTG 3120 
TGAACGGGAG ATGATGCACT GTGTTTTGAA AGTTGTCATT TTAAAGCATT TTAGCACAGT 3180 
TCATAGTCCA CAGTTGATGC AGCATCCTGA GATTTTAAAT CCTGAAGTGT GGGTGGCGCA 3240 
CACACCAAGT AGGGAGCTAG TCAGGCAGTT TGCTTAAGGA ACTTTTGTTC TCTGTCTCTT 3300 
TTCCTTAAAA TTGGGGGTAA GGAGGGAAGG AAGAGGGAAA GAGATGACTA ACTAAAATCA 3360 
TTTTTACAGC AAAAACTGCT CAAAGCCATT TAAAT TAT AT CCTCATTTTA AAAGTTACAT 3420 
TTGCAAATAT TTCTCCCTAT GATAATGCAG TCGATAGTGT GCACTCTTTC TCTCTCTCTC 3 480 
TCTCTCTCAC ACACACACAC ACACACACAC ACACACACAC AGAGACACGG CACCATTCTG 3540 
CCTGGGGCAC TGGAACACAT TCCTGGGGGT CACCGATGGT CAGAGTCACT AGAAGTTACC 3 600 
TGAGTATCTC TGGGAGGCCT CATGTCTCCT GTGGGCTTTT TACCACCACT GTGCAGGAGA 3660 
ACAGACAGAG GAAATGTGTC TCCCTCCAAG GCCCCAAAGC CTCAGAGAAA GGGTGTTTCT 3720 
GGTTTTGCCT TAGCAATGCA TCGGTCTCTG AGGTGACACT CTGGAGTGGT TGAAGGGCCA 3780 
CAAGGTGCAG GGTTAATACT CTTGCCAGTT TTGAAATATA GATGCTATGG TTCAGATTGT 3 840 
TTTTAATAGA AAACTAAAGG GGCAGGGGAA GTGAAAGGAA AGATGGAGGT TTTGTGCGGC 3900 
TCGATGGGGC ATTTGGAACT TCTTTTTAAA GTCATCTCAT GGTCTCCAGT TTTCAGTTGG 3960 
AACTCTGGTG TTTAACACTT AAGGGAGACA AAGGCTGTGT CCATTTGGCA AAACTTCCTT 4020 
GGCCACGAGA CTCTAGGTGA TGTGTGAAGC TGGGCAGTCT GTGGTGTGGA GAGCAGCCAT 4080 
CTGTCTGGCC ATTCAGAGGA TTCTAAAGAC ATGGCTGGAT GCGCTGCTGA CCAACATCAG 4140 
CACTTAAATA AATGCAAATG CAACATTTCT CCCTCTGGGC CTTGAAAATC CTTGCCCTTA 4200 
TCATTTGGGG TGAAGGAGAC ATTTCTGTCC TTGGCTTCCC ACAGCCCCAA CGCAGTCTGT 4260 
GTATGATTCC TGGGATCCAA CGAGCCCTCC TATTTTCACA GTGTTCTGAT TGCTCTCACA 432 0 
GCCCAGGCCC ATCGTCTGTT CTCTGAATGC AGCCCTGTTC TCAACAACAG GGAGGTCATG 43 80 
GAACCCCTCT GTGGAACCCA CAAGGGGAGA AATGGGTGAT AAAGAATCCA GTTCCTCAAA 4440 
ACCTTCCCTG GCAGGCTGGG TCCCTCTCCT GCTGGGTGGT GCTTTCTCTT GCACACCACT 4500 
CCCACCACGG GGGGAGAGCC AGCAACCCAA CCAGACAGCT CAGGTTGTGC ATCTGATGGA 4560 
AACCACTGGG CTCAAACACG TGCTTTATTC TCCTGTTTAT TTTTGCTGTT ACTTTGAAGC 4620 
ATGGAAATTC TTGTTTGGGG GATCTTGGGG CTACAGTAGT GGGTAAACAA ATGCCCACCG 4680 
GCCAAGAGGC CATTAACAAA TCGTCCTTGT CCTGAGGGGC CCCAGCTTGC TCGGGCGTGG 4740 
CACAGTGGGG AATCCAAGGG TCACAGTATG GGGAGAGGTG CACCCTGCCA CCTGCTAACT 4800 
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TCTCGCTAGA CACAGTGTTT 
CATGGGGACG GGGGAAGTTT 
CCAAATAGGT CAATAATTCT 
TCTCTCCCTC CCCTCATCCC 
CACCCAGCTC GCCATGCCTA 
CTTCTTTGTC ATTTGAGAAA 
CAGAAAAACC AGGGCAGGAC 
TAGAGGGACT CCACCCCTGC 
CTCTGCCTTC GGTGGCCCAC 
AACACATCTA CGTGTAGCAC 
AGGCTCTGAT TAAGGATGTG 
CTGGAGGCCT GTCTGTTAGC 
TGCCATCTTC CCTGCGATCA 
TGTGTTATGT CCATTTTGCA 
TTGCTTTGTC TTTTCCATCC 
TCTTTCGATG GATGGAGATG 
ATTTCTGTGA AAACTAGGAG 
TAACACAGTC TTTTTAAAAC 
TCTCCATTGT CTAAATCAGG 
TTAATGCCCC CTACATATTT 
TATGATCCCA GAAAACATCT 
TGGTTTGTGC ATTTTCTCAA 
CTAAT CAAAG ACACTATTTT 
TTTAAAAATA AATTGTGTTT 
AAGCTCTGGA ATCCCTTTAT 
TTCAGCAGAT TTTGCCCACT 
GCTTGAATTA GATCCCTGCA 
GTAATCACTT CATGAATGCT 
TTTGTTTGAC TAATTCTGGA 
ATGTTTCCCA AACTGTGAGG 
CAAAATGGTG CTTTGAGGGT 
TGTGTTATGT GCCTATCCTA 



PCT/US02/12476 



CTGCCCAGGT 
TCACTTGGAG 
GGGAGACTCT 
ACATCTCAAA 
CTCATTCCTG 
GGATGCAGGA 
AGTTAT CGAC 
TCAACAGCTT 
ACACCTAAGC 
TACGACGTTA 
GGGAAGTGGG 
CAGTGGTGGA 
GGCAAAAAAG 
GGATGAACTG 
TCATCACAAG 
AT CATTAGGT 
AACAGAGATG 
TAACATAGGA 
AAAACAGGAA 
CCATCACCTT 
GTCTCTACTT 
CTAAAAATAG 
CATACTAGAT 
TGGTCTGTTC 
TGTGCTGTTG 
ATTCCTCTGA 
AAGGCTTGCT 
AAATGAGAAT 
ATTACAAGAT 
AGGGAAGGCT 
CAGCCTTTAG 
ATAAACTCTT 



GACCTGTTCA 
ATGGACACCA 
TGGAAAAAAC 
GCAGACAATG 
AATTTCAGGT 
GGACAATTCC 
AATG CAT TAG 
GGCTTCCAGG 
GTCATCGTCA 
TGTTTGGGTA 
CTGCGGTCAC 
GGAGCAAGGC 
TGGAATTAAA 
AGTTTAAAAG 
CCCTTGTTTG 
ACTTTTGTTT 
AGATTTGACA 
AAGCCTTTCC 
AACACAGCTT 
GAACAATAGC 
CGGCTGCAAA 
AGATGATAAT 
TCCTGAGACA 
TTGTAGATAA 
CTCTTATCTG 
GCTGAAGTTC 
CTGTGATGTC 
GTAAGTATTT 
TTCTATGCAG 
CAGAGATCGA 
GAAGGTGCAG 
AAACACATT 



Seq ID NO: 345 Protein sequence 
Protein Accession #: NP_036204



11 



MATSMGLLLL 
ATVKSKEEAQ 
EDTPYSNWHK 
KFSFKGMCRP 
KEKAPDVFDW 
ASRNPCSSSP 
TPGGFRCECW 
DGTQCQDVDE 
PDEEDKGEKE 
SGVWREPSIH 
LGLLVYRKRR 



LLLLLTQPGA 
HVQRVLAQLL 
ELRNSCISKR 
LALGGPGQVT 
GSSGPLCVSP 
CRGGATCVLG 
VGYEPGGPGE 
CVGPGGPLCD 
GSTVPRAATA 
HATAASGPQE 
AKREEKKEKK 



21 
I 

GTGADTEAW 
RREAALTARM 
CVSLLLDLSQ 
YTTPFQTTSS 
KYGCNFNNGG 
PHGKNYTCRC 
GACQDVDECA 
SLCFNTQGSF 
SPTRGPEGTP 
PAGGDSSVAT 
PQNAADSYSW 



31 
I 

CVGTACYTAH 
SKFWIGLQRE 
PLLPNRLPKW 
SLEAVPFASA 
CHQDCFEGGD 
PQGYQLDSSQ 
LGRSPCAQGC 
HCGCLPGWVL 
KATPTTSRPS 
QNNDGTDGQK 
VPERAESRAM 



GCAG CAGAAC 


AAGCCAGGGC 


4860 


AGACAATGAA 


GATTTGTTGT 


4920 


TGAATATATT 


^mmm mm. _--_ — _ — jmm— *-mm -mm, -mm j—m 

CAGGACCAAC 


4980 


TAAAGAGAGA 


ACATCTCACA 


5040 


GCCATCACTG 


CTCTTTCTTT 


5100 


CACAGATAAT 


CTGAGGAATG 


5160 


AACTTGGTGA 


GCATCCTCTG 


5220 


CAAGACCAAC 


CACATCTGGT 


5280 


TTGCCATAGC 


_ _____ — _ , - , _ _ _ jm-L 

ATCATGATGC 


5340 


ATGTGGGGAT 


GAACTGCATG 


5400 


TGTCGGCCTT 


GCAAGGCCAC 


5460 


TTCAGGAAGG 


GCCAGCCACA 


5520 


AAGTCAAACC 


TTTATATGCA 


5580 


AATTTTTTTT 


TCTCTTCAAG 


5640 


AGTGTCTTAT 


CCCTGAGCAA 


5700 


CAACCTTTAT 


TCCTGTAAAT 


r-> <t"> A~ f> 

5760 


AAAAAAAATT 


GAATTAAAAA 


5820 


TATTATTTCT 


CTTCTTAGCT 


5880 


TCTAGCAGCT 


GCAAAATGGT 


5940 


TTTAGCTTGG 


GAATCTGAGA 


6000 


mmt — i _— mm* _*' mm jm%m m ■ ■ i 

ACCCATGGTT 


TAAATCTATA 


6060 


CCGAATTCTC 


_Hto _ J| ■ > to 4L #_to fM| mm* 

CATATATTCA 


6120 


AATACTCACT 


>»to — —1 — _. _— *M _— — 4 _^_ 4 «M 

GAAGGGCTTG 


6180 


TGCCCTTCTA 


TTTTAGGTAG 


6240 


CAAGGTGGCA 


AGCAGTTCTT 


6300 


TTTGCATAGA 


TTTGGCTTAA 


6360 


AGATGTAATT 


GTAAATGTCA 


6420 


TTAAATGTGT 


GTATTTCAAA 


" 6480 


GATTTACCTT 


CATCCTGTGC 


6540 


GCTTCTCCTC 


TGAGTTCTAA 


6600 


CTTTGTTGTC 


CTTTGAGCTT 


6660 


41 

i 


51 
i 




1 

SGKLSAAEAQ 


1 

NHCNQNGGNL 


_-" m—\ 

60 


KGKCLDPSLP 


LKGFSWVGGG 


120 


SEGPCGSPGS 


PGSNIEGFVC 


180 


ANVACGEGDK 


DETQSHYFLC 


240 


GSFLCGCRPG 


FRLtLDDLVTC 


3 00 


LDCVDVDECQ 


DSPCAQECVN 


360 


TNTDGSFHCS 


CEEGYVLAGE 


420 


APNGVSCTMG 


PVSLGPPSGP 


480 


LSSDAPITSA 


PLKMLAPSGS 


540 


LLLFYILGTV 


VAILLLLALA 


600 


ENQYSPTPGT 


DC 





Seq ID NO: 346 DNA sequence 
Nucleic Acid Accession #: Z31560 
Coding sequence: <1-966



75 



CACAGCGCCC 
ACTTCGGGGG 
AGCCCGGACC 
CGCAAGATGG 
GCCGAGTGGA 
CTGCGAGCGC 
AAGACGCTCA 
AATAGCATGG 
ATGGACAGTT 
CAGCTGGGCT 
ATGCACCGCT 
ATGAACGGCT 
CTTGGCTCCA 
TCTTCCTCCC 
TATCTCCCCG 
CACTACCAGA 
ATGTGAGGGC 
TGGGAGGGGT 
AAAAA 



11 
I 

GCATGTACAA 
GCGGCGGCGG 
GCGTCAAGCG 
CCCAGGAGAA 
AACTTTTGTC 
TGCACATGAA 
TGAAGAAGGA 
CGAGCGGGGT 
ACGCGCACAT 
ACCCGCAGCA 
ACGACGTGAG 
CGCCCACCTA 
TGGGTTCGGT 
ACTCCAGGGC 
GCGCCGAGGT 
GCGGCCCGGT 
CGGACAGCGA 
GCAAAAGAGG 



21 



CATGATGGAG 
CAACTCCACC 
GCCCATGAAT 
CCCCAAGATG 
GGAGACGGAG 
GGAG CACCCG 
TAAGTACACG 
CGGGGTGGGC 
GAACGGCTGG 
CCCGGGCCTC 
CGCCCTGCAG 
CAGCATGTCC 
GGTCAAGTCC 
GCCCTGCCAG 
GCCGGAACCC 
GCCCGGCACG 
ACTGGAGGGG 
AGAGTAAGAA 



31 

t 

ACGGAGCTGA 
GCGGCGGCGG 
GCCTTCATGG 
CACAACT CGG 
AAGCGGCCGT 
GATTATAAAT 
CTGCCCGGCG 
GCCGGCCTGG 
AGCAACGGCA 
AATGCGCACG 
TACAACTCCA 
TACTCGCAGC 
GAGGCCAGCT 
GCCGGGGACC 
GCCGCCCCCA 
GCCATTAACG 
GGAGAAATTT 
ACAGCATGGA 



41 

I 

AGCCGCCGGG 
CCGGCGGCAA 
TGTGGTCCCG 
AG AT CAGCAA 
TCATCGACGA 
ACCGGCCCCG 
GGCTGCTGGC 
GCGCGGGCGT 
GCTACAGCAT 
GCGCAGCGCA 
TGACCAGCTC 
AGGGCACCCC 
CCAGCCCCCC 
TCCGGGACAT 
GCAGACTTCA 
GCACACTGCC 
TCAAAGAAAA 
GAAAACCCGG 



51 



CCCGCAGCAA 
CCAGAAAAAC 
CGGGCAGCGG 
GCGCCTGGGC 
GGCTAAGCGG 
GCGGAAAACC 
CCCCGGCGGC 
GAACCAGCGC 
GATGCAGGAC 
GATGCAGCCC 
GCAGACCTAC 
TGGCATGGCT 
TGTGGTTACC 
GATCAGCATG 
CATGTCCCAG 
CCTCTCACAC 
ACGAGGGAAA 
TACGCTCAAA 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
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Seq ID NO: 347 Protein sequence 
Protein Accession #: CAA83435 



1 

HSARMYNMME 
RKMAQENPKM 
KTLMKKDKYT 
QLGYPQHPGL 
LGSMGSWKS 
HYQSGPVPGT 



11 
1 

TELKPPGPQQ 
HNSEISKRLG 
LPGGLLAPGG 
NAHGAAQMQP 
EASSSPPWT 
AINGTLPLSH 



21 
1 

TSGGGGGNST 
AEWKLLSETE 
NSMASGVGVG 
MHRYDVSALQ 
SSSHSRAPCQ 
M 



31 
I 

AAAAGGNQKN 
KRPFIDEAKR 
AGLGAGVNQR 
YNSMTSSQTY 
AGDLRDMISM 



41 
I 

SPDRVKRPMN 
LRALHMKEHP 
MDSYAHMNGW 
MNGSPTYSMS 
YLPGAEVPEP 



51 



AFMVWSRGQR 60 

DYKYRPRRKT 120 

SNGSYSMMQD 180 

YSQQGTPGMA 240 

AAPSRLHMSQ 300 
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Seq ID NO: 348 DNA sequence 
Nucleotide Accession #: NM_002638 
Coding sequence: 120-473 



1 
I 

CAATACAGCT 
GCTGGACTGC 
TGAGGGCCAG 
AGGCAGCTGT 
TCAATGGACA 
CGCAAGAGCC 
TCCGGTGCGC 
TCAAGAAGTG 
CGGTCCTTGC 
TGCTGCCCTT 
GAGCTGCCTC 



11 

I 

AAGGAAT TAT 
ATAAAGATTG 
CAGCTTCTTG 
CACGGGAGTT 
AGATCCCGTT 
AGTCAAAGGT 
CATGTTGAAT 
CTGTGAAGGC 
TGCACCTGTG 
CCCCTTCCCA 
TCTCATCCAC 



21 

[ 

CCCTTGTAAA 
GTATGGCCTT 
ATCGTGGTGG 
CCTGTTAAAG 
AAAGGACAAG 
CCAGTCTCCA 
CCCCCTAACC 
TCTTGCGGGA 
CCGTCCCCAG 
CACTGT CCAT 
TTTCCAATAA 



31 
I 

TACCACAGAC 
AGCTCTTAGC 
TGTTCCTCAT 
GTCAAGACAC 
TTTCAGTTAA 
CTAAGCCTGG 
GCTGCTTGAA 
TGGCCTGTTT 
AGCTACAGGC 
TCTTCCTCCC 
A 



41 
I 

CCGCCCTGGA 
CAAACACCTT 
CGCTGGGACG 
TGTCAAAGGC 
AGGTCAAGAT 
CTCCTGCCCC 
AGATACTGAC 
CGTTCCCCAG 
CCCATCTGGT 
ATTCAGGATG 



51 

I 

GCCAGGCCAA 
CCTGACACCA 
CTGGTTCTAG 
CGTGTTCCAT 
AAAGTCAAAG 
ATTATCTTGA 
TGCCCAGGAA 
TGAAGGGAGC 
CCTAAGTCCC 
CCCACGGCTG 



Seq ID NO: 349 Protein sequence
Protein Accession #: NP_002629



11 



21 



31 



41 



51 



1 

III!! 
MRASSFLIW VFLIAGTLVL EAAVTGVPVK GQDTVKGRVP FNGQDPVKGQ VSVKGQDKVK 

AQEPVKGPVS TKPGSCPIIL IRCAMLNPPN RCLKDTDCPG IKKCCEGSCG MACFVPQ 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
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Seq ID NO: 350 DNA sequence 
Nucleic Acid Accession #: NM_007183 
Coding sequence: 75-2468 
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GAATTCCGGA 
GTGGACCTGC 
GCGTGTGCTC 
CGGAGGCCGA 
AGCTGGGACA 
CCAGAGGCAC 
AGGGCCTGAG 
CAGCCTCCTG 
CCCACAATGG 
CCATGCCCAC 
ATGACACACT 
GCCTGGTGTC 
AGCGCCAGGC 
AGGTTTCCCC 
GCAGCCACCG 
CTCGAGCGCC 
ACGTGCATGG 
TTGATGACAT 
AGGTGCTGGG 
AGGCCCGCAG 
AAGTGCAGCG 
AGCTGGCCCT 
ATGATGAGCT 
TGAAGGACCG 
TGTCGGGGGC 
ACAACGCCAC 
TGCGGGAGTG 
CGGGCAAATG 
ACCGCCTCTA 
GGGACCTGGC 
GGCTGCGCGA 
CCAAGGGCCT 
AGCGCTGCGA 
CGGCAGGCGA 
TTCTGAACCC 
CTGGCCTCAT 
TGGTGAGCCA 
AGGTGCTGGT 
CCCGAGACCT 
ACAGCCCCGA 
AG T ACAAC AA 
GCC CAT AGGT 
T CAGCTCC AG 
TCGCTGGGGC 
ATAGCTGGGG 
TGTATGGGGT 
ATCTTGGGAT 
AAAAGGAATT 



11 

I 

CAGGACGTGA 
CGCCATG CAG 
CCTGGCGCTG 
GCGGCTGCGG 
GCAGCCGCGG 
ATCCAGGGGG 
TGGGGACAAG 
GTCCTCCCGC 
GGGCAGCGCC 
CAGGCCCGTG 
CTCCCTGCGC 
TGAGCAGCTG 
CAGCTCCAGC 
GAGCCGGACC 
GAGCCGCGGG 
ATCTGTGCGC 
GTTCAACAGC 
TGACCTGCCC 
AGCGGCCTAC 
CCTTCAGGCC 
CCATGCCACA 
GGTGGAGGAG 
TCGCAAAAAT 
CCTGGCCAGA 
TGGGGGTCCC 
CGGCTTCCTC 
CCACGGGCTG 
CGAGGACAAG 
CGACGAGATG 
GGGGGCGCCG 
GCTGCCCCTC 
CGAGTGGCTG 
GCTCAACCGG 
CCGCAGGTGG 
CCTGCTAGAC 
CCGAAACCTG 
CCTGATCGAG 
C AA CAT CAT A 
GCTGTATTTT 
CAGTGAGAAG 
GCTCCACCGT 
GAAGCCTTCT 
GCTGCTTGGC 
CCCTGTGTGC 
ACTTGGCTTC 
GGTGACCCAG 
AGCCAGCACT 
C 



21 

I 

AGATAGTTGG 
GACGGTAACT 
CCCTCTGACC 
GCAGCCCGCG 
CACAACGGGG 
CAGTACCACA 
ACCTCGGGCT 
TCCGCCGTGG 
TTTGGGGCCG 
TCCTTCCATG 
TCGCTGCGGC 
GAGCCCGCGG 
TCCAGCCGGG 
ATCCGTGCCC 
GTAGGCGGGG 
AGCCTCAGCC 
TACGGTAGCC 
TCAGCAGTCA 
ATCCAGCACA 
GTGCCTAGGC 
GGTGCCATGC 
AACGGGATCT 
GTCACAGGGA 
GACACGCTGG 
CCCCTCATCC 
AGGAACCTCA 
GTGGACGCCC 
AGCGTGGAGA 
CCGCCGTCCG 
CCGGGAGAGG 
GCCGCCGATG 
TGGAGCCCCC 
CACACGACGG 
GCGGGGGTGC 
CGTGT CAGG A 
TCTCGGAACG 
AAGCTGCCAG 
GCTGTGCTCA 
GACGGACTCC 
TCCTCCCGGG 
GACTTTCGGG 
GGAGGAGAAG 
AGCCCAGCCT 
ATCTTTGAGG 
CGCAGGGCAG 
TCACATTGGC 
GGGAATAAAG 



31 
I 

GTTTGGAGGC 
TCCTGCTGTC 
TGCAGCTGGA 
TCCAGGAGCA 
CCGCTGAGCC 
CCCTGCAGGC 
TCCGGCCCAT 
ATCTGAGCTG 
CTGGGTACGG 
AGCGCGGTGG 
TGGGGCCCGG 
CCACCTCCAC 
CAGGGGGGCT 
CTGCCGTGCG 
CAGTGCCGGG 
TCAGCCTGGC 
ACCGAACCCT 
AGTACCTCAT 
AGTGCTACAG 
TGGTGAAGCT 
GCAACCTCAT 
TCGAGCTGCT 
TCCTGTGGAA 
AGCAGCTCAC 
AGCAGAACGC 
GCTCAGCCTC 
TGGTCACCTC 
ACGCGGTGTG 
CGCTGCAGCG 
TCGTGGGCTG 
CGCTCACCTT 
AGATCGTGGG 
AGGCGGCCGC 
TGAGCCGCCT 
CCGCCGACCA 
CTAGGAACAA 
GCAGCGTGGG 
ACAACCTGGT 
GAAAGCTCAT 
CAGCATCCAG 
CGAAGGGCTA 
GTGACGTGGC 
GGAGGAGAAG 
GTCCTGGGCC 
GGGGTGGGGC 
AGAGGTGGGG 
ATGGCCATGA 



41 
I 

GGCCGCCAGG 
GGCCCTGCAG 
CCGCCGGGGC 
GGTCCGCGCC 
CGAGCCTGAG 
TGGCTTCAGC 
CGCCAAGCCG 
CAGTCGGAGG 
GGGTGCCCAG 
GGTTGGGAGC 
GGGCCTGGAC 
CTACAGGGCC 
GGACTGGCCC 
GACCCTGCAG 
GGCCGTCCTG 
TGACTCGGGC 
GCAGAGACTC 
GGCTTCAGAC 
CGATGCAGCC 
CTTCAACCAC 
CTACGACAAC 
GCGGACACTG 
CCTTTCATCC 
GGACCTGGTG 
CTCGGAGGCG 
TCAGGCCACT 
TATCAACCAC 
CGTCCTGCGG 
GCTGGAGGGT 
CTTCACGCCG 
CGCGGAGGTG 
GCTGTACAAC 
CGGGGCGCTG 
GGCCCTGGAG 
CCACCAGCTG 
GGACGAGATG 
TGAGAAGTCG 
GGTGGCCAGC 
CTTCAT CAAG 
CCTCCTGGCC 
TCGGAAGGAG 
CCAGCGTCCA 
GCTAATGACG 
ACCAGGAGGG 
AGGGCTCAAG 
GTTGGCTGTG 
ACAGTCACAA 



51 
I 

CCCAGGCCCG 60 

CCTGAGGCCG 120 

GCCGAGGGGC 180 

CGCCTCTTGC 240 

GCCGAGACTG 300 

TCTCGCTCTC 360 

GCCTACAGCC 42 0 

CTGAGTTCAG 480 

CCCACCCCTC 540 

CGGGCCGACT 600 

GACCGCTACA 660 

TTTGCGTACG 720 

GAGGCCACTG 780 

CGATTCCAGA 840 

GAG CCAGTGG 900 

CACCTGCCGG 960 

AGCAGCGGTT 102 0 

CCCAACCTGC 1080 

GCCAAGAAGC 1140 

GCCAACCAGG 12 00 

GCTGACAACA 12 60 

CGGGAGCAGG 1320 

AGCGACCACC 13 80 

TTGAGCCCCC 1440 

GAGATCTTCT 1500 

CGCCAGAAGA 1560 

GCCCTGGACG 1620 

AACCTGTCCT 1680 

CGCGGCCGCA 1740 

CAGAGCCGGC 1800 

TCCAAGGACC 1860 

CGGCTGCTGC 1920 

CAG AA CATC A 1980 

CAGGAGCGTA 2040 

CGCTCACTGA 2100 

TCCACGAAGG 2160 

CCCCCAGCCG 2220 

CCCATCGCTG 2280 

AAGAAGCGGG 2340 

AACCTGTGGC 2400 

GACTTCCTGG 2460 

AGGGACAGAC 2520 

GAGGGGCCCC 2580 

GCAGGGTCTT 2640 

GCTGCTCTGG 2700 

GCCTGGCAGT 2760 

AAAAAAAAAA 2820 



85 



Seq ID NO: 351 Protein sequence 
Protein Accession #: NP_009114.1



11 



21 



31 



41 



51 



318 



WO 02/086443 

I I I 

MQDGNFLLSA LQPEAGVCSL ALPSDLQLDR 

PRHNGAAEPE PEAETARGTS RGQYHTLQAG 

SRSAVDLSCS RRLSSAHNGG SAFGAAGYGG 

LRSLRLGPGG LDDRYSLVSE QLEPAATSTY 

RTIRAPAVRT LQRFQSSHRS RGVGGAVPGA 

NSYGSHRTLQ RLSSGFDDID LPSAVKYLMA 

QAVPRLVKLF NHANQEVQRH ATGAMRNLIY 

KNVTGILWNL SSSDHLKDRL ARDTLEQLTD 

FLRNLSSASQ ATRQKMRECH GLVDALVTSI 

EMPPSALQRL EGRGRRDLAG APPGEWGCF 

WLWSPQIVGL YNRLLQRCEL NRHTTEAAAG 

LDRVRTADHH QLRSLTGLIR NLSRNARNKD 

I I AVLNNLW ASPIAARDLL YFDGLRKLIF 

HRDFRAKGYR KEDFLGP 



I i 1 

RGAEGPEAER LRAARVQEQV RARLLQLGQQ 

FSSRSQGLSG DKTSGFRPIA KPAYSPASWS 

AQPTPPMPTR PVSFHERGGV GSRADYDTLS 

RAFAYERQAS SSSSRAGGLD WPEATEVSPS 

VLEPVARAPS VRSLSLSLAD SGHLPDVHGF 

SDPNLQVLGA AYIQHKCYSD AAAKKQARSL 

DNADNKLALV EENGIFELLR TLREQDDELR 

LVLSPLSGAG GPPLIQQNAS EAEIFYNATG 

NHALDAGKCE DKSVENAVCV LRNLSYRLYD 

TPQSRRIiREL PLAADALTFA EVSKDPKGLE 

ALQNITAGDR RWAGVLSRLA LEQERILNPL 

EMSTKWSHL IEKLPGSVGE KSPPAEVLVN 

IKKKRDSPDS EKSSRAASSL LANLWQYNKL 



Seq ID NO: 352 DNA sequence
Nucleic Acid Accession #: M31469
Coding sequence: 1-651

1 11 21 31 41 51 

| | | | | |

ATGGCTGCGC AGGGAGAGCC CCAGGTCCAG TTCAAACTTG TATTGGTTGG TGATGGTGGT
ACTGGAAAAA CGACCTTCGT GAAACGTCAT TTGACTGGTG AATTTGAGAA GAAGTATGTA
GCCACCTTGG GTGTTGAGGT TCATCCCCTA GTGTTCCACA CCAACAGAGG ACCTATTAAG
TTCAATGTAT GGGACACAGC CGGCCAGGAG AAATTCGGTG GACTGAGAGA TGGCTATTAT
ATCCAAGCCC AGTGTGCCAT CATAATGTTT GATGTAACAT CGAGAGTTAC TTACAAGAAT
GTGCCTAACT GGCATAGAGA TCTGGTACGA GTGTGTGAAA ACATCCCCAT TGTGTTGTGT
GGCAACAAAG TGGATATTAA GGACAGGAAA GTGAAGGCGA AATCCATTGT CTTCCACCGA
AAGAAGAATC TTCAGTACTA CGACATTTCT GCCAAAAGTA ACTACAACTT TGAAAAGCCC 
TTCCTCTGGC TTGCTAGGAA GCTCATTGGA GACCCTAACT TGGAATTTGT TGCCATGCCT 
GCTCTCGCCC CACCAGAAGT TGTCATGGAC CCAGCTTTGG CAGCACAGTA TGAGCACGAC 
TTAGAGGTTG CTCAGACAAC TGCTCTCCCG GATGAGGATG ATGACCTGTG A 

Seq ID NO: 353 Protein sequence 
Protein Accession #: AAA36546 

1 11 21 31 41 51 

| | | | | |

MAAQGEPQVQ FKLVLVGDGG TGKTTFVKRH LTGEFEKKYV ATLGVEVHPL VFHTNRGPIK

FNVWDTAGQE KFGGLRDGYY IQAQCAIIMF DVTSRVTYKN VPNWHRDLVR VCENIPIVLC

GNKVDIKDRK VKAKSIVFHR KKNLQYYDIS AKSNYNFEKP FLWLARKLIG DPNLEFVAMP

ALAPPEVVMD PALAAQYEHD LEVAQTTALP DEDDDL



Seq ID NO: 354 DNA sequence 
Nucleic Acid Accession #: NM_002820 
Coding sequence: 304-831 

1 11 21 31 41 51 

I I I l I l 

CCGGTTCGCA AAGAAGCTGA CTTCAGAGGG GGAAACTTTC TTCTTTTAGG AGGCGGTTAG 
CCCTGTTCCA CGAACCCAGG AGAACTGCTG GCCAGATTAA TTAGACATTG CTATGGGAGA 
CGTGTAAACA CACTACTTAT CATTGATGCA TATATAAAAC CATTTTATTT TGGCTATTAT 
TTCAGAGGAA GCGCCTCTGA TTTGTTTCTT TTTTCCCTTT TTGCTCTTTC TGGCTGTGTG 
GTTTGGAGAA AGCACAGTTG GAGTAG CCGG TTGCTAAATA AGTCCCGAGC GCGAGCGGAG 
ACGATGCAGC GGAGACTGGT TCAGCAGTGG AGCGTCGCGG TGTTCCTGCT GAGCTACGCG 
GTGCCCTCCT GCGGGCGCTC GGTGGAGGGT CTCAGCCGCC GCCTCAAAAG AGCTGTGTCT 
GAACATCAGC TCCTCCATGA CAAGGGGAAG TCCATCCAAG ATTTACGGCG ACGATTCTTC 
CTTCACCATC TGAT CGCAGA AATCCACACA GCTGAAATCA GAG CT AC CT C GGAGGTGTCC 
CCTAACTCCA AGCCCTCTCC CAACACAAAG AACCACCCCG TCCGATTTGG GTCTGATGAT 
GAGGGCAGAT ACCTAACTCA GGAAACTAAC AAGGTGGAGA CGTACAAAGA GCAGCCGCTC 
AAGACACCTG GGAAGAAAAA GAAAGGCAAG CCCGGGAAAC GCAAGGAGCA GGAAAAGAAA 
AAACGGCGAA CTCGCTCTGC CTGGTTAGAC TCTGGAGTGA CTGGGAGTGG GCTAGAAGGG 
GACCACCTGT CTGACACCTC CACAACGTCG CTGGAGCTCG ATTCACGGTA ACAGGCTTCT 
CTGGCCCGTA GCCTCAGCGG GGTGCTCTCA GCTGGGTTTT GGAGCCTCCC TTCTGCCTTG 
GCTTGGACAA ACCTAGAATT TTCTCCCTTT ATGTATCTCT ATCGATTGTG TAGCAATTGA 
CAGAGAATAA CTCAGAATAT TGTCTGCCTT AAAGCAGTAC CCCCCTACCA CACACACCCC 
TGTCCTCCAG CACCATAGAG AGGCGCTAGA GCCCATTCCT CTTTCTCCAC CGTCACCCAA 
CATCAATCCT TTACCACTCT ACCAAATAAT TTCATATTCA AGCTTCAGAA GCTAGTGACC 
AT CTTCATAA TTTGCTGGAG AAGTGTATTT CTTCCCCTTA CTCTCACACC TGGGCAAACT 
TTCTTCAGTG TTTTTCATTT CTTACGTTCT TTCACTTCAA GGGAGAATAT AGAAGCATTT 
GATATTATCT ACAAACACTG C AG AACAG C A T CATGT CAT A AACGATTCTG AGCCATTCAC 
ACTTTTTATT TAATTAAATG TATTTAATTA AATCTCAAAT TTATTTTAAT GTAAAGAACT 
TAAATTATGT TTTAAACACA TGCCTTAAAT TTGTTTAATT AAATTTAACT CTGGTTTCTA 
CCAGCTCATA CAAAATAAAT GGTTTCTGAA AATGTTTAAG TATTAACTTA CAAGGATATA 
GGTTTTTCTC ATGTATCTTT TTGTTCATTG GCAAGATGAA ATAATTTTTC TAGGGTAATG 
CCGTAGGAAA AATAAAACTT CACAT T T AAA AAAAA 

Seq ID NO: 355 Protein sequence 
Protein Accession #: NM__ 002820 

1 11 21 31 41 51 

I i I l I I 

MQRRLVQQWS VAVFLLSYAV PSCGRSVEGL SRRLKRAVSE HQLLHDKGKS IQDLRRRFFL 
HHLIAEIHTA EIRATSEVSP NSKPSPNTKN HPVRFGSDDE GRYLTQETNK VETYKEQPLK 



319 



WO 02/086443 

TPGKKKKGKP GKRKEQEKKK RRTRSAWLDS GVTGSGLEGD HLSDTSTTSL ELDSR 



Seq ID NO: 356 DNA sequence 
Nucleic Acid Accession #: NM_017522 
Coding sequence: 1-2100 



1 11 21 31 41 51 

I I I I I I 

ATGGGCCTCC CCGAGCCGGG CCCTCTCCGG CTTCTGGCGC TGCTGCTGCT GCTGCTGCTG 60 

CTGCTGCTGC TGCGGCTCCA GCATCTTGCG GCGGCAGCGG CTGATCCGCT GCTCGGCGGC 120 

CAAGGGCCGG CCAAGGAGTG CGAAAAGGAC CAATTCCAGT GCCGGAACGA GCGCTGCATC 180 

CCCTCTGTGT GGAGATGCGA CGAGGACGAT GACTGCTTAG ACCACAGCGA CGAGGACGAC 240 

TGCCCCAAGA AGACCTGTGC AGACAGTGAC TTCACCTGTG ACAACGGCCA CTGCATCCAC 300 

GAACGGTGGA AGTGTGACGG CGAGGAGGAG TGTCCTGATG GCTCCGATGA GTCCGAGGCC 360 

ACTTGCACCA AGCAGGTGTG TCCTGCAGAG AAGCTGAGCT GTGGACCCAC CAGCCACAAG 420 

TGTGTACCTG CCTCGTGGCG CTGCGACGGG GAGAAGGACT GCGAGGGTGG AGCGGATGAG 480 

GCCGGCTGTG CTACCTCACT GGGCACCTGC CGTGGGGACG AGTT CCAGTG TGGGGATGGG 540 

ACATGTGTCC TTGCAATCAA GCACTGCAAC CAGGAGCAGG ACTGTCCAGA TGGGAGTGAT 600 

GAAGCTGGCT GCCTACAGGG GCTGAACGAG TGTCTGCACA AC AATGG CGG CTGCTCACAC 660 

ATCTGCACTG ACCTCAAGAT TGGCTTTGAA TGCACGTGCC CAGCAGGCTT CCAGCTCCTG 720 

GACCAGAAGA CTTGTGGCGA CATTGATGAG TGCAAGGACC CAGATGCCTG CAGCCAGATC 780 

TGTGTCAATT ACAAGGGCTA TTTTAAGTGT GAGTGCTACC CTGGCTGCGA GATGGACCTA 840 

CTGACCAAGA ACTGCAAGGC TGCTGCTGGC AAGAGCCCAT CCCTAATCTT CACCAACCGC 900 

ACGAGTGCGG AGGATCGACC TGTGAAGCGG AACTATTCAC GCCTCATCCC CATGCTCAAG 960 

AATGTCGTGG CACTAGATGT GGAAGTTGCC ACCAATCGCA TCTACTGGTG TGACCTCTCC 1020 

TACCGTAAGA TCTAT AG CGC CTACATGGAC AAGGCCAGTG ACCCGAAAGA GCGGGAGGTC 1080 

CTCATTGACG AGCAGTTGCA CTCTCCAGAG GGCCTGGCAG TGGACTGGGT CCACAAGCAC 1140 

AT CTACTGG A CTGACTCGGG CAATAAGACC AT CTCAGTGG CCACAGTTGA TGGTGGCCGC 1200 

CGACGCACTC TCTTCAGCCG TAACCTCAGT GAACCCCGGG CCATCGCTGT TGACCCCCTG 1260 

CGAGGGTTCA TGTATTGGTC TGACTGGGGG GACCAGGCCA AGATTGAGAA ATCTGGGCTC 1320 

AACGGTGTGG ACCGGCAAAC ACTGGTGTCA GACAATATTG AATGG C C CAA CGGAATCACC 1380 

CTGGATCTGC TGAGCCAGCG CTTGTACTGG GTAGACTCCA AGCTACACCA ACTGTCCAGC 1440 

ATTGACTTCA GTGGAGGCAA CAGAAAGACG CTGATCTCCT CCACTGACTT CCTGAGCCAC 1500 

CCTTTTGGGA TAGCTGTGTT TGAGGACAAG GTGTTCTGGA CAGACCTGGA GAACGAGGCC 1560 

ATTTTCAGTG CAAATCGGCT CAATGGCCTG GAAATCTCCA TCCTGGCTGA GAACCTCAAC 162 0 

AACCCACATG ACATTGT CAT CTTCCATGAG CTGAAGCAGC CAAGAGCTCC AGATGCCTGT 1680 

GAGCTGAGTG TCCAGCCTAA TGGAGGCTGT GAATACCTGT GCCTTCCTGC TCCTCAGATC 1740 

TCCAGCCACT CTCCCAAGTA CACATGTGCC TGTCCTGACA CAATGTGGCT GGGTCCAGAC 1800 

ATGAAGAGGT GCTA CCGAGA TGCAAATGAA GACAGTAAGA TGGGCTCAAC AGTCACTGCC 1860 

GCTGTTATCG GGAT CATCGT GCCCATAGTG GTGATAGCCC TCCTGTGCAT GAGTGGATAC 192 0 

CTGATCTGGA GAAACTGGAA G CGGAAGAAC ACCAAAAGCA TGAATTTTGA CAACCCAGTC 1980 

TACAGGAAAA CAACAGAAGA AGAAGATGAA GATGAGCTCC ATATAGGGAG AACTGCTCAG 2040 

ATTGGCCATG TCTATCCTGC ACGAGTGGCA TTAAGCCTTG AAGATGATGG ACTACCCTGA 2100 

GGATGGGATC ACCCCCTTCG TGCCTCATGG AATTCAGTCC CATGCACTAC ACTCCGGATG 2160 

GTGTATGACT GGATGAATGG GTTTCTATAT ATGGGTCTGT GTGAGTGTAT GTGTGTGTGT 2220 

GATTTTTTTT TTTAAATTTA TGTTGCGGAA AGGTAACCAC AAAGTTATGA TGAACTGCAA 2280 

ACATCCAAAG GATGTGAGAG TTTTTCTATG TATAATGTTT TATACACTTT TTAACTGGTT 2340 

GCACTACCCA TGAGGAATTC GTGGAATGGC TACTGCTGAC TAACATGATG CACATAACCA 2400 

AATGGGGGCC AATGGCACAG TACCTTACTC AT CATTTAAA AACTATATTT ACAGAAGATG 24 60 

TTTGGTTGCT GGGGGGCTTT TTTAGGTTTT GGGCATTTGT TTTTTGTAAA TAAGATGATT 252 0 
ATGCTTTGTG GCTATCCATC AACATAAGT 



Seq ID NO: 357 Protein sequence 
Protein Accession #: NP_059992 

1 11 21 31 41 51 

I I I I ! 1 

MGLPEPGPLR LLALLLLLLL LLKLRLQHLA AAAADPLLGG QGPAKECEKD QFQCRNERCI 60 

PSVWRCDEDD DCLDHSDEDD CPKKTCADSD FTCDNGHCIH ERWKCDGEEE CPDGSDESEA 120 

TCTKQVCPAE KLSCGPTSHK CVPASWRCDG EKDCEGGADE AGCATSLGTC RGDEFQCGDG 180 

TCVLAIKHCN QEQDCPDGSD EAGCLQGI*NE CLHNNGGCSH ICTDLKIGFE CTCPAGFQLL 240 

DQKTCGDIDE CKDPDACSQI CVNYKGYFKC ECYPGCEMDL LTKNCKAAAG KSPSLIFTNR 3 00 

TSAEDRPVKR NYSRLIPMLK NWALDVEVA TNRIYWCDLS YRKIYSAYMD KASDPKEREV 3 60 

LIDEQLHSPE GLAVDWVHKH IYWTDSGNKT I SVATVDGGR RRTLFSRNLS EPRAIAVDPL*" 420 

RGFMYWSDWG DQAKIEKSGL NGVDRQTLVS DNIEWPNGIT LDLLSQRLYW VDSKLHQLSS 480 

IDFSGGNRKT LISSTDFLSH PFGIAVFEDK VFWTDLENEA IFSANRLNGL EISILAENLN 540 

NPHDIVIFHE LKQPRAPDAC ELSVQPNGGC EYLCLPAPQI SSHSPKYTCA CPDTMWLGPD 600 

MKRCYRDANE DSKMGSTVTA AVIGIIVPIV VIALLCMSGY LIWRNWKRKN TKSMNFDNPV 660 
YRKTTEEEDE DELHIGRTAQ IGHVYPARVA LSLEDDGLP 



Seq ID NO: 358 DNA sequence 
Nucleic Acid Accession #: M27826 
Coding sequence: <l-503 



1 11 21 31 41 51 

1 I I I 1 1 

AGCCCAAGAA ACATCTCACC AATTTCAAAT CTGATCTATT CGGCTTAGCG ACTGAAGATT 60 

GACGCTGCCC GATCGCCTCG GAAGTCCCCT GGACCATCAC AGAAGCCGAG CTTCGGGTAA 120 

CTCT CACAGT GGAGGGTAAG TCCATCCCCT GTTTAATCGA TACGGGGGCT ACCCACTCCA 180 

CGTTGCCTTC TTTTCAAGGG CCTGTTTCCC TTGCCCCCAT AACTGTTGTG GGTATTGACG 240 

GCCAAGCTTC AAAACCCCTG AAAACTCCCC CACTCTGGTG CCAACTTGGA CAACACTCTT 300 

TTATGCACTC TTTTTTAGTT ATCCCCACCT GCCCACTTCC CTTATTAGGC CGAAATATTT 360 

TAACCAAATT ATCTGCTTCC CTGACTATTC CTGGAGTACA GCTACATCTC ATTGCTGCCC 420 

TTCTTCCCAA TCCAAAGCCT CCTTTGTGTC CTCTAACATC CCCACAATAT CAGCCCTTAC 480 

CACAAGACCT CCCTTCAGCT TAATCTCTCC CACT CTAGGT TCCCACGCCG CCCCTAATCC 540 

CACTTGAAGC AGCCCTGAGA AACATCGCCC ATTCTCTCTC CATACCACCC CCCAAAAATT 600 

TTCGCCGCTC CAACACTTCA ACACTATTTT GTTTTATTTG TCTTATTAAT AT CAGAAGGC 660 



320 



WO 02/086443 

AGGAATGTCA GGCCTCTGAG 
ACATCCAGAT GGCCTGAAGT 
ATGACATTCC ACCATTGTGA 
ATCTCCCCCA CCCTTAAGAA 
TGAGATCCAC CCCTGCCCAC 
CCCAAATCCT ATAAAACAGC 
AGCCACCGGC ACCCAGGTGA 



PCT/US02/12476 



CCCAGGCCAG 
AACTGAAGAT 
TTTGTTCCTG 
GGTTCTTTGT 
CAGAGAACAA 
CCCACCCCTA 
AATAAACAGC 



GCCAT CGCAT 
CCACAAAAGA 
CCCCACCCTA 
AATTCTCCCC 
CCCCCTTTGA 
TCTTCCTTCA 
TTTATTGCTC 



CCCCTGTGAC 


TTGCACGTAT 


720 


AGTAAAAACA 


GCCTTAACTG 


780 


ACTGATCAAT 


GTACTTTGTA 


840 


ACCCTTGAGA 


ATGTACTTTG 


900 


TTGTAATTTT 


TTATTACCTT 


960 


CTGACTCTCT 


TTTCGGACTC 


1020 


AC 







10 



Seq ID NO: 359 Protein sequence 
Protein Accession #: AAA65999 



15 



20 



25 
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60 



65 



70 



75 



80 



1 11 21 31 41 51 

I I I I I I 

PKKHLTNFKS DLFGLATEDW RCPIASEVPW TITEAELRVT LTVEGKSIPC LIDTGATHST 

LPSFQGPVSL APITWGIDG QASKPLKTPP LWCQLGQHSF MHSFLVIPTC PLPLLGRNIL 

TKLSASLTIP GVQLHLIAAL LPNPKPPLCP LTSPQYQPLP QDLPSA 

Seq ID NO: 360 DNA sequence 
Nucleic Acid Accession #: NM_001854 
Coding sequence: 162-5582 



60 
120 



85 



1 
I 

AACCATCAAA 
TGTGTAGCAA 
TTCGTGGGTT 
GGTGGAAAAC 
TCTTCCAAGC 
TTCACAATTC 
CTAAAGGCTC 
AACAGTT AT T 
CAAAAAAAGG 
TTGGTGTTGA 
CCCCAGAAGA 
TAGCAATCAG 
CGAAACCACT 
GAACAAGGAT 
GTGATCCCAA 
CACCCAAGGC 
TCGAATATGA 
GACCCACTGT 
AAGAATACAA 
GGACAAATGA 
ATTATGATTC 
GCAGGGATTC 
AAGAATATGA 
CAGAAACTGA 
AGAAAGGAGA 
CAGGACCTGC 
ACCCTGGCGA 
GTCCTCCTGG 
CAACCATCTC 
TGAGAGGCCC 
GTTCATCTGG 
AGGGTCCCCC 
GAAGAGGAAT 
GTCTGCCAGG 
CTGGTGATGA 
AAGCTGGCCC 
GTATGGCAGG 
CTGGGCCTCC 
CAATTGGTCC 
GTGCTGATGG 
TGGGTCCCCC 
CAGATGGTGT 
GATTCAAAGG 
GAGGGNAAGA 
CTTCAGGTCA 
GAAGACAAGG 
AAGGTGCACG 
CTCGAGGTTC 
GTGGCGATGG 
TTGGATTCCC 
ACCCTGGGCA 
GAGTGGTTGG 
CTGGTCCTCC 
CAAAGGGTGA 
GTTTCCCAGG 
AAGGTCCCCA 
CAGCTGGCCC 
GAGAGAAAGG 
AAGGTCCTGT 
ACAAGGGTGA 
GCCCTCCCGG 
ATGGTGAACC 
CCAGAGGCTT 
GTGAAAAAGG 



11 
I 

TTTAGAAGAA 
ACATCCCTGG 
GAGTTCACAG 
GAAACGGTGG 
TAGAGAGGTC 
TCCAGAGGGA 
AGATACTGCT 
TCCAGGTGGA 
AATTCAGTCT 
GGTTGGGAGA 
CTATCCCCTC 
CGTGGAGAAG 
TGATAGAAGT 
TTTGGATGAA 
GGCAGCATAT 
TGCTCAAGCT 
CTATGAGTAT 
AACTGAGGAG 
CTATGGAACA 
GCCAAATCCA 
CCAGAGGAAA 
TGATCTTCTG 
AGATAAACCA 
TATTACAGAA 
ACCAGCAGTG 
AGGTATTATG 
TAGGGGCCCC 
TACTATGTTG 
TGCTCAGGAA 
ACCTGGCCCA 
GGCCAAAGGT 
TGGTCCAACG 
GCCAGGAGAA 
TGACAAAGGT 
TGGAATGAGG 
ACGAGGTTTG 
TGTAGATGGC 
AGGTCAACAA 
TCCTGGTGAA 
GCCTCCTGGT 
TGGT CCACAA 
CAGAGGTCTC 
TGACATGGGT 
TGGCCCTGAA 
AG CAGGAGAA 
TCCAAAGGGT 
GGGAGTAGCT 
AAGAGGTGCA 
CCCTCCTGGC 
TGGACCAAAA 
ACGTGGGGAG 
ACCACAGGGA 
TGGCCCTCCT 
TCCAGGTCCT 
GGAAAGAGGT 
GGGCCCACCA 
AATTGGTTTA 
TGCTCCTGGA 
TGGT CTCCCA 
AATTGGTGAG 
TCCCCCAGGT 
AGGTCCTAGA 
CCCTGGACCT 
TGAAAATGGG 



21 



AAAGCCCTTT 
CGATACCTTG 
TTGTGAGTGC 
CTCTGGGATT 
AGAGGAGCTG 
AT AT C AAAAA 
TACAGAGTTT 
ACTTTCCCAG 
TTCCTTTTAT 
T CACCTGTTT 
TTCAGAACTG 
AAAACTGTGA 
GAGAGAGCAA 
GAAGTTTTTG 
GACTACTGTG 
CAGGAACCTC 
GGGGAAGCAG 
ACAATAGCAC 
ATGGAAAGTT 
GTTGAAGAAA 
AAT TCTGAGG 
GTAGATGGAG 
ACAAGCCCCC 
ACAAGCATAA 
GTTGAGCCTG 
GGTCCTCCAG 
CCAGGACGTC 
ATGTTACCGT 
GCTCAGGCTC 
ATGGGTCTAA 
GAGAGTGGTG 
GGAAAACCTG 
CCTGGGGCAA 
CACAGGGGTG 
GGAGAAGATG 
CTGGGTCCAA 
CCCCCAGGAC 
GGGAATCCAG 
AAAGGACCAC 
CATCCTGGGA 
GGTCCTATTG 
AAGGGATCTA 
CTAAAAGGTG 
GGACCCAAAG 
AAGGGAAAAC 
TCCACTGGAT 
GGCAAACCAG 
AGAGGTCCCA 
CCTCCAGGTG 
GGCCCTCCTG 
ACTGGATTTC 
CCAACCGGTG 
GGTGAGCAAG 
CAAGGTATCT 
CTTCCTGGAG 
GGTCCAGTTG 
CGAGGGCGCC 
GAAAAAGGTC 
GGGCCAGCTG 
CCGGGACAAA 
CTTCAAGGAC 
GGACAGCAGG 
CCTGGTCCAA 
GATGTTGGTC 



31 
I 

GACTTTTTCC 
GAAAGGACGA 
GGGGCTCGGA 
TCACCGTAAC 
CTCCAGTTGA 
CAACGGGATT 
CAAAGCAAGC 
AAGACTTTTC 
CTATATATAA 
TTCTGTTTGA 
TTAACATCGC 
CAATGATTGT 
TTGTTGATAC 
AGGGGGACAT 
AGCATTATAG 
AGATAGATGA 
AGTATAAAGA 
AGACGGAGGC 
ACCAGACAGA 
TATTTACTGA 
ATACACTATA 
ATTTAGGCGA 
CTAATGAAGA 
ATGGCCATGG 
GTATGCTTGT 
GTCTACAAGG 
CTGGCTTACC 
TCCGTTATGG 
AAGCTATTCT 
CTGGAAGACC 
ATCCAGGTCC 
GAAAAAGGGG 
AGGGAG AT CG 
AACGAGGTCC 
GAGAAATTGG 
GGGGAACTCC 
CAAAAGGGAA 
GACCTCAGGG 
AAGGAAAACC 
AAGAAGGCCA 
GATNNCCGGG 
AAGGTGAAAA 
ACAGAGGAGA 
GTCGAGCAGG 
TTGGAGTTCC 
TCCCTGGGTT 
GCCCTCGGGG 
CTGGGAAACC 
AAAGAGGTCC 
GACCACCAGG 
AAGG CAAG AC 
AGACTGGT CC 
GTCTTCCTGG 
CAGGGAAAGA 
CTCAGGGTGC 
GCTCACCAGG 
CGGGACCTCA 
CCCAAGGGCC 
GTCCTGCCGG 
AAGGCAGCAA 
CAGTTGGTGC 
GGATGTTTGG 
TAGGTCTTCA 
CATGGGGGCC 



41 
I 

CCCTCTCCCT 
AGTTGGTCTG 
GATGGAGCCG 
AACCCTCGCA 
TGTACTAAAA 
TTGCACAAAC 
ACAACTCAGT 
AATACTATTT 
TGAGCATGGT 
AGACCACACT 
TGACGGGAAG 
TGATTGTAAG 
CAATGGAATC 
TCAGCAGTTT 
TCCAGACTGT 
GTATGCACCA 
GGCTGAAAGT 
AAACATCGTT 
AGCTCCTAGG 
AGAATATCTA 
TGAAAACAAA 
ATATGATTTT 
ATTTGGTCCA 
TGCATATGGA 
CGAAGGACCA 
CCCCACTGGA 
AGGGGCTGAT 
TGGTGATGGT 
TCAGCAGGCT 
AGGTCCTGTG 
TCAGGGCCCT 
TCGTCCAGGT 
AGGGTTTGAT 
TCAAGGTCCT 
ACCAAGAGGT 
AGGAGCTCCA 
CATGGGTCCC 
TCTTCCTGGT 
AGGACTTGCT 
GTCTGGAGAA 
CCCCCGGGGA 
GGGTGAAGAT 
AGTTGGTCAA 
CCCAACTGGA 
AGGATTACCA 
TCCAGGTGCC 
TCAGCGTGGT 
TGGGCCAAAG 
TCAAGGACCT 
AAGGATGGGC 
CGGCCCTCCT 
AATAGGGGAA 
TGCTGCAGGA 
TGGACCAGCA 
ACCTGGACTG 
AGAACGTGGG 
GGGTCCTCCT 
TGCAGGGAGA 
CTCCCCTGGG 
GGGTGGCAAG 
CCCTGGAATT 
GCAAAAAGGT 
GGGTCTGCCA 
ACCTGGTCCT 



51 



CCCCAATGGC 
CAGTCGCAAT 
TGGTCCTCTA 
TTGACCTTCC 
GCACTAGATT 
AGAAAGAATT 
GCCCCAACAA 
ACAGTAAAAC 
ATTCAGCAAA 
GGAAAACCTG 
TGGCATCGGG 
AAGAAAACCA 
ACGGTTTTTG 
TTGATCACAG 
GACTCTTCAG 
GAGGATATAA 
GTAACAGAGG 
GATGATTTTC 
CATGTTTCTG 
ACGGGAGAGG 
GAAATAGACG 
TATGAATATA 
GGTGTACCAG 
GAGAAAGGAC 
CCAGGACCAG 
CCCCCTGGTG 
GGTCTACCTG 
TCCAAAGGAC 
CGGATTGCTC 
GGGGGGCCTG 
CGAGGCGTCC 
GCAGATGGAG 
GGACTTCCGG 
CCAGGTCCTC 
CTTCCAGGTG 
GGGCAGCCTG 
CAAGGGGAGC 
CCACAAGGTC 
GGACTTCCTG 
AAGGGGGCTC 
GTAAAGGGAG 
GGTTTTCCAG 
ATTGGCCCAA 
GACCCAGGTC 
GGATATCCAG 
AATGGAGAGA 
CCAACGGGTC 
GGCACTTCAG 
CAGGGTCCAG 
TGCCCAGGAC 
GGGCCAGGGG 
CGTGGGTATC 
AAAGAAGGTG 
GGATTACGTG 
AAAGGAGGGG 
TCAGCAGGTA 
GGTCCAGCTG 
GATGGAGTTC 
GAAGACGGAG 
GGAGAAAATG 
GCTGGAGGTG 
GATGAGGGTG 
GGCCCACCTG 
CCAGGCCCAA 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 



i 
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GAGGCCCTCA AGGTCCCAAT GGAGCTGATG GACCACAAGG ACCCCCAGGT TCTGTTGGTT 3900 

CAGTTGGTGG TGTTGGAGAA AAGGGTGAAC CTGGAGAAGC AGGAAACCCA GGGCCTCCTG 3 960 

GGGAAGCAGG TGTAGGCGGT CCCAAAGGAG AAAGAGGAGA GAAAGGGGAA GCTGGTCCAC 4020 

CTGGAGCTGC TGGACCTCCA GGTGCCAAGG GGCCGCCAGG TGATGATGGC CCTAAGGGTA 4080 

ACCCGGGTCC TGTTGGTTTT CCTGGAGATC CTGGTCCTCC TGGGGAACTT GGCCCTGCAG 4140 

GTCAAGATGG TGTTGGTGGT GACAAGGGTG AAGATGGAGA TCCTGGTCAA CCGGGTCCTC 42 0 0 

CTGGCCCATC TGGTGAGGCT GGCCCACCAG GTCCTCCTGG AAAACGAGGT CCTCCTGGAG 4260 

CTGCAGGTGC AGAGGGAAGA CAAGGTGAAA AAGGTGCTAA GGGGGAAGCA GGTGCAGAAG 4320 

GTCCTCCTGG AAAAACCGGC CCAGTCGGTC CTCAGGGACC TGCAGGAAAG CCTGGTCCAG 43 80 

AAGGTCTTCG GGGCATCCCT GGTCCTGTGG GAGAACAAGG TCTCCCTGGA GCTGCAGGCC 4440 

AAGATGGACC ACCTGGTCCT ATGGGACCTC CTGGCTTACC TGGTCTCAAA GGTGACCCTG 4500 

GCTCCAAGGG TGAAAAGGGA CATCCTGGTT TAATTGGCCT GATTGGTCCT CCAGGAGAAC 4560 

AAGGGGAAAA AGGTGACCGA GGGCTCCCTG GAACTCAAGG ATCTCCAGGA GCAAAAGGGG 4620 

ATGGGGGAAT TCCTGGTCCT GCTGGTCCCT TAGGTCCACC TGGTCCTCCA GGCTTACCAG 4 680 

GTCCTCAAGG CCCAAAGGGT AACAAAGGCT CTACTGGACC CGCTGGCCAG AAAGGTGACA 4740 

GTGGTCTTCC AGGGCCTCCT GGGCCTCCAG GTCCACCTGG TGAAGTCATT CAGCCTTTAC 4800 

CAATCTTGTC CTCCAAAAAA ACGAGAAGAC ATACTGAAGG CATGCAAGCA GATGCAGATG 4860 

ATAATATTCT TG AT TACT CG GATGGAATGG AAGAAATATT TGGTTCCCTC AATTCCCTGA 4920 

AACAAGACAT CGAGCATATG AAATTTCCAA TGGGTACTCA GACCAATCCA GCCCGAACTT 4980 

GTAAAGACCT GCAACTCAGC CATCCTGACT TCCCAGATGG TGAATATTGG ATTGATCCTA 5040 

ACCAAGGTTG CTCAGGAGAT TCCTTCAAAG TTTACTGTAA TTTCACATCT GGTGGTGAGA 5100 

CTTGCATTTA TCCAGACAAA AAATCTGAGG GAGTAAGAAT TTCATCATGG CCAAAGGAGA 5160 

AACCAGGAAG TTGGTTTAGT GAATTTAAGA GGGGAAAACT GCTTTCATAC TTAGATGTTG 522 0 

AAGGAAATTC CATCAATATG GTGCAAATGA CATTCCTGAA ACTTCTGACT GCCTCTGCTC 52 80 

GGCAAAATTT CACCTACCAC TGTCAT CAGT CAGCAGCCTG GTATGATGTG TCATCAGGAA 5340 

GTTATGACAA AGCACTTCGC TTCCTGGGAT CAAATGATGA GGAGATGTCC TATGACAATA 5400 

ATCCTTTTAT CAAAACACTG TATGATGGTT GT ACGT CCAG AAAAGGCTAT GAAAAAACTG 5460 

TCATTGAAAT CAATACACCA AAAATTGATC AAGTACCTAT TGTTGATGTC ATGATCAGTG 5520 

ACTTTGGTGA TCAGAATCAG AAGTTCGGAT TTGAAGTTGG TCCTGTTTGT TTTCTTGGCT 5580 

AAGATTAAGA CAAAGAACAT ATCAAAT CAA CAGAAAATGT ACCTTGGTGC CACCAACCCA 5640 

TTTTGTGCCA CATGCAAGTT TTGAATAAGG ATGTATGGAA AACAACGCTG CATATACAGG 5700 

TACCATTTAG GAAATAC CG A TGCCTTTGTG GGGGCAGAAT CACAGACAAA AGCTTTGAAA 5760 

ATCATAAAGA TATAAGTTGG TGTGGCTAAG ATGGAAACAG GGCTGATTCT TGATTCCCAA 582 0 

TTCTCAACTC TCCTTTTCCT ATTTGAATTT CTTTGGTGCT GTAGAAAACA AAAAAAGAAA 5 880 

AATATATATT CATAAAAAAT ATGGTGCTCA TTCTCATCCA TCCAGGATGT ACTAAAACAG 5940 

TGTGTTTAAT AAATTGTAAT TATTTTGTGT ACAGTTCTAT ACTGTTATCT GTGTCCATTT 600 0 

CCAAAACTTG CACGTGTCCC TGAATTCCGC TGACT CTAAT TTATGAGGAT GCCGAACTCT 6060 

GATGGCAATA ATATATGTAT TATGAAAATG AAGTTATGAT TTCCGATGAC CCTAAGTCCC 6120 
TTTCTTTGGT TAATGATGAA ATTCCTTTGT GTGTGTTT 

Seq ID NO: 361 Protein sequence 
Protein Accession #: NP_001845 

1 11 21 31 41 51 

1 I I I I I 

MEPWSSRWKT KRWLWDFTVT TLALTFLFQA REVRGAAPVD VLKALDFHNS PEGISKTTGF 60 

CTNRKNSKGS DTAYRVSKQA QLSAPTKQLF PGGTFPEDFS ILFTVKPKKG IQSFLLSIYN 120 

EHGIQQIGVE VGRSPVFLFE DHTGKPAPED YPLFRTVNIA DGKWHRVAIS VEKKT VTM I V 180 

DCKKKTTKPL DRSERAIVDT NGITVFGTRI LDEEVFEGDI QQFLITGDPK AAYDYCEHYS 240 

PDCDSSAPKA AQAQEPQIDE YAPEDIIEYD YEYGEAEYKE AESVTEGPTV TEETIAQTEA 300 

NIVDDFQEYN YGTMESYQTE APRHVSGTNE PNPVEEIFTE EYLTGEDYDS QRKNSEDTLY 360 

ENKEIDGRDS DLLVDGDLGE YDFYEYKEYE DKPTSPPNEE FGPGVPAETD ITETSINGHG 420 

AYGEKGQKGE PAWEPGMLV EGPPGPAGPA GIMGPPGLQG PTGPPGDPGD RGPPGRPGLP 480 

GADGLPGPPG TMLMLPFRYG GDGSKGPTIS AQEAQAQAIL QQARIALRGP PGPMGLTGRP 540 

GPVGGPGSSG AKGESGDPGP QGPRGVQGPP GPTGKPGKRG RPGADGGRGM PGEPGAKGDR 600 

GFDGLPGLPG DKGHRGERGP QGPPGPPGDD GMRGEDGEIG PRGLPGEAGP RGLLGPRGTP 660 

GAPGQPGMAG VDGPPGPKGN MGPQGEPGPP GQQGNPGPQG LPGPQGPIGP PGEKGPQGKP 720 

GLAGLPGADG PPGHPGKEGQ SGEKGALGPP GPQGPIGXPG PRGVKGADGV RGLKGSKGEK 780 

GEDGFPGFKG DMGLKGDRGE VGQIGPRGXD GPEGPKGRAG PTGDPGPSGQ AGEKGKLGVP 840 

GLPGYPGRQG PKGSTGFPGF PGANGEKGAR GVAGKPGPRG QRGPTGPRGS RGARGPTGKP 900 

GPKGTSGGDG PPGPPGERGP QGPQGPVGFP GPKGPPGPPG RMGCPGHPGQ RGETGFQGKT 960 

GPPGPGGWG PQGPTGETGP IGERGYPGPP GPPGEQGLPG AAGKEGAKGD PGPQGISGKD 102 0 

GPAGLRGFPG ERGLPGAQGA PGLKGGEGPQ GPPGPVGSPG ERGSAGTAGP IGLRGRPGPQ 1080 

GPPGPAGEKG APGEKGPQGP AGRDGVQGPV GLPGPAGPAG SPGEDGDKGE IGEPGQKGSK 1140 

GGKGENGPPG PPGLQGPVGA PGIAGGDGEP GPRGQQGMFG QKGDEGARGF PGPPGPIGLQ 12 00 

GLPGPPGEKG ENGDVGPWGP PGPPGPRGPQ GPNGADGPQG PPGSVGSVGG VGEKGEPGEA 12 60 

GNPGPPGEAG VGGPKGERGE KGEAGPPGAA GPPGAKGPPG DDGPKGNPGP VGFPGDPGPP 132 0 

GELGPAGQDG VGGDKGEDGD PGQPGPPGPS GEAGPPGPPG KRGPPGAAGA EGRQGEKGAK 13 80 

GEAGAEGPPG KTGPVGPQGP AGKPGPEGLR GIPGPVGEQG LPGAAGQDGP PGPMGPPGLP 1440 

GLKGDPGSKG EKGHPGLIGL IGPPGEQGEK GDRGLPGTQG SPGAKGDGGI PGPAGPLGPP 1500 

GPPGLPGPQG PKGNKGSTGP AGQKGDSGLP GPPGPPGPPG EVIQPLPILS SKKTRRHTEG 1560 

MQADADDNIL DYSDGMEEIF GSLNSLKQDI EHMKFPMGTQ TNPARTCKDL QLSHPDFPDG 162 0 

EYWIDPNQGC SGDSFKVYCN FTSGGETCIY PDKKSEGVRI SSWPKEKPGS WFSEFKRGKL 1680 

LSYLDVEGNS INMVQMTFLK LLTASARQNF TYHCHQSAAW YDVSSGSYDK ALRFLGSNDE 1740 

EMS YDNNP F I KTLYDGCTSR KGYEKTVIEI NTPKIDQVPI VDVMISDFGD QNQKFGFEVG 1800 
PVCFLG 



Seq ID NO: 362 DNA sequence 
Nucleic Acid Accession #: NM_003107 
Coding sequence: 351-1775 

1 11 21 31 41 51 

11)111 

TTCCCCAGCA TTCGAGAAAC TCCTCTCTAC TTTAGCACGG TCTCCAGACT CAGCCGAGAG 60 
ACAGCAAACT GCAGCGCGGT GAGAGAGCGA GAGAGAGGGA GAGAGAGACT CTCCAGCCTG 120 
GGAACTATAA CTCCTCTGCG AGAGGCGGAG AACTCCTTCC CCAAATCTTT TGGGGACTTT 180 



322 



10 



15 



20 



25 



30 



35 



40 



45 
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TCTCTCTTTA CCCACCTCCG 
CGTCTTCCCG TTCGGCGTGT 
CGGCCGCCGC GAGGGTGTGA 
AAACCAACAA TGCCGAGAAC 
CCGGCCTCGA GCTGGGAATC 
GCAAGGCCGA CGACCCGAGC 
ACGCCTTCAT GGTGTGGTCG 
TGCACAACGC CGAGATCTCC 
ACAAG AT CCC TTTCATTCGA 
CCGACTACAA GTACCGGCCC 
CGGCCGCCGC CTCCTCCAAG 
GCGGCCATGG GGGCGGCGGC 
CGAGTGGCGG CGGCGCCAAC 
CGGGCGGCGC GGGCGGTGGG 
GCGGCGGCGG GAAAGCAGCG 
CCGCCGCCCT GCTGCCCCTG 
CTCCCAGCGC CTCGGCCTCC 
CGGGCAAGCA CCTGGCGGAG 
CGTCGT CGTC GCCCGTGGGC 
TGTACGAGGA GGAGGGCGCG 
GCGCCGCCTC GTCCCCCGCC 
TGCGCGCCGC CTCGCCCGCC 
CCCACTCCTC CTCTTCCTCC 
ACCTGCTCGA CCTGAACCCC 
CGTCGTCGGC GCTCGACCGG 
TCGAGTTCCC GGACTACTGC 
AGTCCAGCAT CTCCAACCTG 
CGGGGGGGGT AGGAGAGGAG 
GAGTTTAAAG AGAAAAGGGA 
TCTCGTCGTC GGAT CAAGGA 
TCCCGGGCCG GGGACCCACT 
AGGGGCGACC TGTGATTGTT 
TTCGAGTTTG CTCCCCTTTG 
TTGTCTGCAC CCCCAGCAAG 
CTTCCTGCAT CACCACCTTG 
GAACCCAGCG CACCCCTCCC 
GGTGACGAAT TTGGCCGATG 
GCAGGCGAAT TCCCGTTTGG 
AGCCGGAGGA GGAGATGTTG 
ACCCGAGAAC CCCGTTGGAA 
CGAACTGGAA GGGGGTTCAC 
CGGCGGCTGC TGGGCCTCCG 
GACCCCGGAG GCGTGGAGGA 
GGCGAGTGGT TTCGGAAAAA 



PCT/US02/12476 



CCCCTGCGAG 
GCTTGGCCCG 
GCGCGCGTGG 
ACGGAAGCGC 
GCCTCCTCCC 
TGGTGCAAGA 
CAG AT CGAGC 
AAGCGGCTGG 
GAGGCGGAGC 
AGGAAGAAGG 
CCGGGGGAGA 
GGCGGCGGGA 
TCCAAACCGG 
GTTAGCAAAC 
GCTGCCGCCG 
GGCGCCGCCG 
GCCTCCTCGG 
AAGAAGGTGA 
GGCGTGGGCG 
GGCTGCTCGC 
GCCGGCCGCT 
CCGTCCAGCG 
TCCTCGGGCT 
AGCTCAAACT 
GACCTGGATT 
ACGCCCGAGG 
GTTTTCACCT 
AAAAAAAAAG 
AAAAAGAAAG 
GGGCGGCGGC 
CTGCCCAGCC 
GTTATTGATG 
CTTGAAGAGA 
AAGGCGAGTT 
GTTTTGTTTT 
CCCCTTTTTT 
GCAGATGTTT 
GGCCTTTTTT 
AGGGGAGGAG 
GCGCAGCAGC 
GGTCAAACTG 
CCTTCTTTTC 
GAGGAGACTG 
AAAAAAGAAA 



GAGTTGAGGG 
GGGAACCGGG 
GCGCCCGCCG 
TGCTGGCCGG 
CCACGCCCGG 
CCCCGAGTGG 
GGCGCAAGAT 
GCAAACGCTG 
GGCTGCGCCT 
TGAAGTCCGG 
AGGGAGACAA 
GCAGCAACGC 
CGCAGAAAAA 
CGCACGCCAA 
CCGCCTCCTT 
CCGACCACCA 
CAGCCTCGGC 
AGCGCGTCTA 
CGGGAGCCGA 
CCGACGCGCC 
CGCCCGCCGA 
CGCCCTCGCA 
CCTCGTCCTC 
TTGAGAGCAT 
TTAACTTCGA 
TG AG CG AG AT 
ACTGAAGGGC 
TGAAAAAAAG 
AAAAAGTAAG 
GTTTTGGACC 
GGAGGGACGC 
TTGTTGTTGA 
CCCCCTCCCC 
AGTTTTCTAG 
ATTTTGCTTC 
TAAACGCGTG 
TGGGGGAACG 
TCCTCCCTCT 
GCCAGCCAGT 
GGGAGCTAGG 
AAATGGATTT 
TACGTGAAAT 
TTTGATGTGG 
AAAAGGG 



GCCAGTTCGG 
AGGGCCCGGC 
AGCCGAGGCC 
CGAGAGCTCG 
CTCCACCGCC 
GCACAT CAAG 
CATGGAGCAG 
GAAGCTGCTC 
CAAG CACAT G 
CAACGCCAAC 
GGTCGGTGGC 
GGGGGGAGGA 
GAGCTGCGGC 
GCTCATCCTG 
CGCCGCCGAA 
CTCGCTGTAC 
CTCCGCAGCG 
CCTGTTCGGC 
CCCCAGCGAC 
CAGCCTGAGC 
CCACCGCGGC 
CGCGTCCTCC 
CGACGACGAG 
GTCCCTGGGC 
GCCCGGCTCC 
GATCTCGGGA 
GCGCAGGCAG 
AAACGAAAAG 
CAGGGCTCGT 
CGCGCTCCCA 
GGAGGAGGAA 
TGGCAAAAAA 
CTTCCAACGA 
AGACTTGAAG 
TTGGTCAAGA 
ATGAAGACAG 
CCGGGACTGA 
TTTCCCCTTG 
GTGACCGGCG 
GGCGGGGGCG 
GCACGTTGGG 
CAGTGAGGTG 
TACAGGGGCA 



CCGCCGCGCG 240 

GATCGCGCGG 300 

ATGGTGCAGC 360 

GACTCGGGCG 420 

TCCACGGGCG 480 

CGACCCATGA 540 

TCGCCCGACA 600 

AAAGACAGCG 660 

GCTGACTACC 720 

TCCAGCTCCT 780 

AGTGGCGGGG 840 

GGCGGCGGTG 900 

TCCAAAGTGG 960 

GCAGGCGGCG 1020 

CAGGCGGGGG 1080 

AAGGCGCGGA 1140 

CTCGCGGCCC 1200 

GGCCTGGGCA 1260 

CCCCTGGGCC 1320 

GGCCGCAGCA 13 80 

TACGCCAGCC 1440 

TCGGCCTCGT 150 0 

TTCGAAGACG 1560 

AGCTTCAGTT 162 0 

GGCTCGCACT 1680 

GACTGGCTCG 1740 

GGAGAAGGGC 1800 

GACAGACGAA 1860 

TCGCCCGCGT 192 0 

TCCCCCACCT 1980 

GAGGGTAGAC 2040 

AAAAAGCGAC 2100 

GCTTCCGGAC 2160 

GAGTCTCCCC 2220 

AAGGAGGGGA 2280 

AAGGCTCCGG 2 3 40 

GAGACTCCAC 2400 

CCCCCTCTGC 2460 

CTAGGAAATG 2520 

GAGGAGGACA 2580 

GAGCTGGCGG 2640 

AGACTTCCCA 2700 

GTCAGTGGAG 2760 



Seq ID NO: 363 Protein sequence 
Protein Accession #: NP 003098 



50 



55 



60 



65 



70 



75 



80 



85 



MVQQTNNAEN 
RPMNAFMVWS 
ADYPDYKYRP 
GGGASGGGAN 
QAGAAALLPL 
GLGTSSSPVG 
YASLRAASPA 
SFSSSSALDR 



TE ALL AGES S 
QIERRKIMEQ 
RKKVKSGNAN 
SKPAQKKSCG 
GAAADHH SLY 
GVG AG AD PSD 
PSSAPSHASS 
DLDFNFEPGS 



21 
I ' 

DSGAGLELGI 
S PDMHNAE I S 
SSSSAAASSK 
SKVAGGAGGG 
KARTPSASAS 
PLGLYEEEGA 
SASSHSSSSS 
GSHFEFPDYC 



31 

1 

ASSPTPGSTA 
KRLGKRWKLL 
PGEKGDKVGG 
VSKPHAKL I L 
ASSAASASAA 
GCSPDAPSLS 
SSGSSSSDDE 
TPEVSEMISG 



41 
I 

STGGKADDPS 
KDSDKIPFIR 
SGGGGHGGGG 
AGGGGGGKAA 
LAAPGKHLAE 
GRSSAASSPA 
FEDDLLDLNP 
DWLESSISNL 



51 
I 

WCKTPSGHIK 
EAERLRLKHM 
GGGSSNAGGG 
AAAAASFAAE 
KKVKRVYLFG 
AGRSPADHRG 
SSNFESMSLG 
VFTY 



Seq ID NO: 3 64 DNA sequence 
Nucleic Acid Accession #: U10860 
Coding sequence: 123-2204 



11 



21 



TGCCGGCTGC 
GGCACCCTCC 
CGATGGCTCT 
GCCACCACCA 
TCATAGACCG 
CAGCATTTGC 
CTGTGTATGC 
TTCTTGGAAT 
AAAAAAGTGT 
TCAGGGGCCT 
TAGCTGATGG 
AATCTAAAAA 
AAGTAATACT 
AGAACAGAGA 
TGGTTTTACT 
TGAACCAAGA 
GCCAGTCTGT 
CTCATTCTTT 
GGAAAAGAAT 
TTGGGGATAC 
AGGAGGTTTT 



TCCTCGACCA 
CGCCCCGTCT 
GTGCAACGGA 
CTATGAAGGA 
AAGAGTGAGG 
TATAAAGGAA 
TGAAGATGCT 
TTGCTATGGT 
CAGAGAAGAT 
TCAGAAGGAA 
ATTCAAGGTT 
GTTATATGGA 
GAAGAATTTC 
ACTTGAGTGT 
CAGTGGTGGA 
ACAAGTCATT 
TGAAGAGGCC 
CTACAATGGA 
TAGCAAAACG 
TTTTGTTAAG 
CCTTGCCCAA 



GGCCTCCTTC 
CGTACTGTCG 
GACTCCAAGC 
GCTGTTGTCA 
GAACTGTTCG 
CAAGGAT TCC 
CCCTGGTTTG 
ATGCAGATGA 
GGAGTTTTCA 
GAAGTTGTTT 
GTGGCACGTT 
GCACAGTTCC 
CTTTATGATA 
ATTCGAGAGA 
GTAGACTCAA 
GCTGTG CACA 
CTCAAAAAGC 
ACAACAACCC 
TTAAATATGA 
ATTGCCAATG 
GGTACTTTAC 



31 
1 

TCAACCTCAG 
CCGTCACCGC 
TGGAGAATGC 
TTCTGGATGC 
TGCAGTCTGA 
GTGCTATTAT 
ATCCAGCAAT 
TGAATAAG GT 
ACATTAGTGT 
TGCTTACACA 
CTGGAAACAT 
ACCCTGAAGT 
TAGCTGGATG 
TCAAAGAGAG 
CAGTTTGTAC 
TTGATAATGG 
TTGGAATTCA 
TACCAATATC 
CCACAAGTCC 
AAGTAATTGG 
GGCCTGATCT 



41 

I 

CCCGCGGCGC 
CGCGGCTCCG 
TGGAGGAGAC 
TGGTGCTCAG 
AATTTTCCCC 
CATCTCTGGA 
ATTCACTATT 
ATTTGGAGGT 
GGATAATACA 
TGGAGATAGT 
AGTAGCAGGC 
TGGCCTTACA 
CAGTGGAACC 
AGTAGGCACG 
AGCTTTGCTA 
CTTTATGAGA 
GGTCAAAGTG 
AGATGAAGAT 
TGAAGAGAAA 
AGAAATGAAC 
AATTGAAAGT 



51 
I 

CGACCCTTCC 
GCCCTGGCCC 
CTTAAGGATG 
TACGGGAAAG 
TTGGAAACAC 
GGACCTAATT 
GGCAAGCCTG 
ACTGTGCACA 
TGTTCATTAT 
GTAGACAAAG 
ATAGCAAATG 
GAAAATGGAA 
TTCACCGTGC 
TCAAAAGTTT 
AATCGTGCTT 
AAACGAGAAA 
ATAAATGCTG 
AGAACCCCAC 
AGAAAAATCA 
TTGAAACCAG 
GCATCCCTTG 



60 
120 
180 
240 
300 
360 
420 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
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10 



15 



WO 02/086443 

TTGCAAGTGG CAAAGCTGAA 
AGTTGAGAGA GGAGGGAAAA 
GAATTTTGGG CAGAGAACTT 
GTCCTGGCCT GGCAATCAGA 
CTGAAACCAA CAATATTTTG 
ATACCCTATT AC AG AG AGT C 
AAATTACCAG TCTGCATTCA 
AGGGTGACTG TCGTTCCTAC 
GGGAATCACT TATTTTT CTG 
TTGTT TATAT ATTTGGCCCA 
TGACAACAGG GGTGCTCAGT 
GGGAGTCTGG GTATGCTGGG 
TTGATCGGGA CCCACTTCAA 
TTATTACTAG TGACTTCATG 
AGGTGGTATT AAAGATGGTC 
ATGACTTAAC ATCAAAGCCC 



PCT/US02/12476 



CTC AT CAAAA 
GTAATAGAAC 
GGACTTCCAG 
GTAATATGTG 
AAAATAGTAG 
AAAGCCTGCA 
CTGAATGCCT 
AGTTACGTGT 
GCTAGGCTTA 
CCAGTTAAAG 
ACTTTACGCC 
AAAATCAGCC 
AAGCAGCCTT 
ACTGGTATAC 
ACTGAGATTA 
CCAGGAACTA 



CCCATCACAA 
CTCTGAAAGA 
AAGAGTTAGT 
CTGAAGAACC 
CTGATTTTTC 
CAACAGAAGA 
TCTTGCTGCC 
GTGGAATCTC 
TACCTCGCAT 
AACCTCCTAC 
AAGCTGATTT 
AGATGCCGGT 
CATGCCAGAG 
CTGCAACACC 
AGAAGATTCC 
CTGAGTGGGA 



TGACACAGAG 
TTTT CATAAA 
TTCCAGGCAT 
TTATATTTGT 
TGCAAGTGTT 
GGATCAGGAG 
AATTAAAACT 
CAGTAAAGAT 
GTGTCACAAC 
AGATGTTACT 
TGAGGCCCAT 
GATTTTGACA 
ATCTGTGGTT 
TGGCAATGAG 
TGGTATTTCT 
GTAATAAACT 



CTCATCAGAA 1320 

GATGAAGTGA 13 80 

CCATTTCCAG 1440 

AAGGACTTTC 1500 

AAAAAGCCAC 1560 

AAGCTGATGC 1620 

GTAGGTGTGC 1680 

GAACCTGACT 1740 

GTTAACAGAG 180 0 

CCCACTTTCT 1860 

AACATTCTCA 192 0 

CCATTACATT 1980 

ATTCGAACCT 2040 

ATCCCTGTAG 2100 

CGAATTATGT 2160 
TC 



20 



Seq ID NO: 365 Protein sequence 
Protein Accession #: AAA60331 



25 



30 



35 



I 

MALCNGDSKL 
AF A I KEQGFR 
KSVREDGVFN 
SKKLYGAQFH 
VLLSGGVDST 
HSFYNGTTTL 
EVFLAQGTLR 
ILGRELGLPE 
TLLQRVKACT 
ESLIFLARLI 
ESGYAGKISQ 
WLKMVTEIK 



11 
I 

ENAGGDIjKDG 
AIIISGGPNS 
ISVDNTCSLF 
PEVGLTENGK 
VCTALLNRAI* 
PI SDEDRTPR 
PDLIESASLV 
ELVSRHPFPG 
TEEDQEKLMQ 
PRMCHNVNRV 
MPVILTPLHF 
KIPGISRIMY 



21 
I 

HHHYEGAWI 
VYAEDAPWFD 
RGIjQKEEWL 
VILKNFLYDI 
NQEQVIAVHI 
KRISKTLNMT 
ASGKAELIKT 
PGLAIRVICA 
ITSLHSLNAF 
VYIFGPPVKE 
DRDPLQKQPS 
DLTSKPPGTT 



31 



LDAGAQYGKV 
PAIFTIGKPV 
LTHGDSVDKV 
AGCSGTFTVQ 
DNGFMRKRES 
TSPEEKRKII 
HHNDTEL I RK 
EEPYICKDFP 
LLPIKTVGVQ 
PPTDVTPTFL 
CQRSWIRTF 
EWE 



41 
I 

IDRRVRELFV 
LGICYGMQMM 
ADGFKWARS 
NRELECIREI 
QSVEEALKKL 
GDTFVKIANE 
LREEGKVIEP 
ETNNILKIVA 
GDCRSYSYVC 
TTGVLSTLRQ 
ITSDFMTGIP 



51 
I 

QSEIFPLETP 60 

NKVFGGTVHK 120 

GNIVAGIANE 180 

KERVGTS KVL 240 

GIQVKVINAA 3 00 

VIGEMNLKPE 360 

LKDFHKDEVR 420 

DFSASVKKPH 480 

GISSKDEPDW 540 

ADFEAHNILR 600 

ATPGNEIPVE 660 



40 



45 



50 



55 



60 



Seq ID NO: 3 66 DNA sequence 
Nucleic Acid Accession #: NM_004219 
Coding sequence: 46-654 



GCGGCCTCAG 
TATGTTGATA 
CTGGGGTCTG 
TTTGG CAAAA 
ACTGTCAACA 
CCAAGCTTTT 
GCCTCAGATG 
GAGAGTTTTG 
CTCATGATCC 
CCTGTGAAGA 
CTGTCGACCC 
TAGTGCTTCA 
AAAAAAAA 



11 
I 

ATGAATGCGG 
AGGAAAATGG 
GACCTTCAAT 
CGTTCGATGC 
GAGCTACAGA 
CTG CCAAAAA 
ATGCCTATCC 
ACCTGCCTGA 
TTGACGAGGA 
TGCCCTCTCC 
TGGATGTTGA 
GAGTTTGTGT 



21 



CTGTTAAGAC 
AGAACCAGGC 
CAAAGCCTTA 
CCCACCAGCC 
AAAGTCTGTA 
GATGACTGAG 
AGAAATAGAA 
AGAGCACCAG 
GAGAGAGCTT 
ACCATGGGAA 
ATTGCCACCT 
GTATTTGTAT 



31 

1 

CTGCAATAAT 
ACCCGTGTGG 
GATGGGAGAT 
TTACCTAAAG 
AAGACCAAGG 
AAGACTGTTA 
AAATTCTTTC 
ATTGCGCACC 
GAAAAGCTGT 
TCCAATCTGT 
GTTTGCTGTG 
TAATAAAGCA 



41 



51 



CCAGAATGGC 
TTGCTAAGGA 
CTCAAGTTTC 
CTACTAGAAA 
GACCCCTCAA 
AAGCAAAAAG 
CCTTCAATCC 
TCCCCTTGAG 
TTCAGCTGGG 
TGCAGTCTCC 
ACATAGATAT 
TTCTTCAACA 



TACTCTGATC 
TGGGCTGAAG 
AACACCACGT 
GGCTTTGGGA 
ACAAAAACAG 
CTCTGTTCCT 
TCTAGACTTT 
TGGAGTGCCT 
CCCCCCTTCA 
TTCAAGCATT 
TTAAATTTCT 
GAAAAAAAAA 



65 



Seq ID NO: 367 Protein sequence 
Protein Accession #: NP_004210 

1 11 21 31 41 51 

I I I 1 I I 

MATLIYVDKE NGEPGTRWA KDGLKLGSGP SIKALDGRSQ VSTPRFGKTF DAPPALPKAT 

RKALGTVNRA TEKSVKTKGP LKQKQPSFSA KKMTEKTVKA KSSVPASDDA YPEIEKFFPF 

NPLDFESFDL PEEHQIAHLP LSGVPLMILD EERELEKLFQ LGPPSPVKMP SPPWESNLLQ 

SPSSILSTLD VELPPVCCDI DI 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 



60 
120 
180 



70 



75 



80 



85 



Seq ID NO: 3 68 DNA sequence 
Nucleic Acid Accession #: NM_000597 
Coding sequence: 118-1104 



ATTCGGGGCG 
CCTGCCCGCC 
CTGCCGAGAG 
CCGCTGCTGC 
CTGTTCCGCT 
GCGCCGCCCG 
GTCCGGGAGC 
GGCGTCTACA 
CTGCCCCTGC 
TATGGCGCCA 
GTGGAGAACC 
AAGCCCCTCA 
CACCGGCAGA 
CGACCACCCC 



11 

1 

AGGGAGGAGG 
CGCCCGCTCG 
TGGGCTGCCC 
TGCTGCTACT 
GCCCGCCCTG 
CCGCGGTGGC 
CGGGCTGCGG 
CCCCGCGCTG 
AGGCGCTGGT 
GCCCGGAGCA 
ACGTGGACAG 
AGTCGGGTAT 
TGGGCAAGGG 
CTGCCAGGAC 



21 

1 

AAGAAGCGGA 
CTCGCTCGCC 
CGCGCTGCCG 
GGGCGCGAGT 
CACACCCGAG 
CGCAGTGGCC 
CTGCTGCTCG 
CGGCCAGGGG 
CATGGGCGAG 
GGTTGCAGAC 
CACCATGAAC 
GAAGGAGCTG 
TGGCAAGCAT 
TCCCTGCCAA 



31 
I 

GGAGGCGGCT 
CGCCGCGCCG 
CTGCCGCCGC 
GGCGGCGGCG 
CGCCTGGCCG 
GGAGGCGCCC 
GTGTGCGCCC 
CTGCGCTGCT 
GGCACTTGTG 
AATGGCGATG 
ATGTTGGGCG 
GCCGTGTTCC 
CACCTTGGCC 
CAGGAACTGG 



41 



51 



CCCGCTCGCA 
CGCTGCCGAC 
CGCCGCTGCT 
GCGGGGCGCG 
CCTGCGGGCC 
GCATG CCATG 
GGCTGGAGGG 
ATCCCCACCC 
AGAAGCGCCG 
ACCACTCAGA 
GGGGAGGCAG 
GGGAGAAGGT 
TGGAGGAGCC 
ACCAGGTCCT 



GGGCCGTGCA 60 

CGCCAGCATG 12 0 

GCCGCTGCTG 180 

CGCGGAGGTG 240 

CCCGCCGGTT 3 00 

CGCGGAGCTC 3 60 

CGAGGCGTGC 42 0 

GGGCTCCGAG 480 

GGACGCCGAG 540 

AGGAGGCCTG 600 

TGCTGGCCGG 660 

CACTGAGCAG 720 

CAAGAAGCTG 780 

GGAG CGGATC 840 



324 



10 



WO 02/086443 

TCCACCATGC GCCTTCCGGA 
CCCAACTGTG ACAAGCATGG 
CAGCGTGGGG AGTGCTGGTG 
ACCAT CCGGG GGGACCCCGA 
GTGCACACCC AGCGGATGCA 
GCCCCTCTCC AAACACCGGC 
TTCCAGTTCT GACACACGTA 
CCCGGCCTCT CTCTTCCCAG 
GAGGAAGGGG GTTGTGGTCG 
TTTATTTTTG AACCCCTGTG 



TGAGCGGGGC 
CCTGTACAAC 
TGTGAACCCC 
GTGTCATCTC 
GTAGACCGCA 
AGAAAACGGA 
TTTATATTTG 
CTG CAGATGC 
GGGAGCTGGG 
TCCCTTTTGC 



CCTCTGGAGC 
CTCAAACAGT 
AACACCGGGA 
TTCTACAATG 
GCCAGCCGGT 
GAGTGCTTGG 
GAAAGAGACC 
CACACCTGCT 
GTACAGGTTT 
ATAAGATTAA 



ACCTCTACTC 
GCAAGATGTC 
AGCTGATCCA 
AGCAGCAGGA 
GCCTGGCGCC 
GTGGTGGGTG 
AGCACCGAGC 
CCTTCTTGCT 
GGGGAGGGGG 
AGGAAGGAAA 



CCTGCACATC 900 

TCTGAACGGG 960 

GGGAGCCCCC 1020 

GGCTTGCGGG 1 0 B 0 

CCTGCCCCCC 1140 

CTGGAGGATT 1200 

TCGGCACCTC 1260 

TTCCCCGGGG 1320 

AAGAGAAATT 1380 
AGT 



PCT/US02/12476 



15 



20 



Seq ID NO: 369 Protein sequence 
Protein Accession #: NP 000588 



MLPRVGCPAL 
VAPPAAVAAV 
ELPLQALVMG 
RKPLKSGMKE 
ISTMRLPDER 
PTIRGDPECH 



11 
I 

PLPPPPLLPL 
AGGARMPCAE 
EGTCEKRRDA 
LAVFREKVTE 
GPLEHLYSLH 
LFYNEQQEAC 



21 
I 

LPLLLIiLLGA 
LVREPGCGCC 
EYGASPEQVA 
QHRQMGKGGK 
IPNCDKHGLY 
GVHTQRMQ 



31 
I 

SGGGGGARAE 
SVCARLEGEA 
DNGDDHSEGG 
HHLGLEEPKK 
NLKQCKMSLN 



41 
I 

VLPRCPPCTP 
CGVYTPRCGQ 
LVENHVDSTM 
IiRPPPARTPC 
GQRGECWCVN 



51 

! 

ERLAACGPPP 60 

GLRCYPHPGS 120 

NMLGGGGSAG 180 

QQELDQVLER 240 

PNTGKLIQGA 3 00 



Seq ID NO: 370 DNA sequence 
25 Nucleic Acid Accession #: NM_004264 
Coding sequence: 6-440 



30 



35 



40 



GGAACATGGC 
TTTGTAATGC 
AGACAGCAAT 
CAGCACTGAT 
AAGAATCTAC 
AAGCTGCTAC 
AAAGCGCACT 
AGTCTCTTCC 
GTGCCATTAA 
TTAAACACTA 
GATAAGCTTA 
GAGTGAAATT 
AATTCTGTTA 
C 



11 
I 

GGAT CGGCTC 
CATTGGAGTA 
TAACAAAGAC 
TGCACGAACA 
AGCTGCTTTA 
ATGTGTGGAG 
TGCTGATATT 
AGACTCATAG 
GAATTCTGCA 
TGACACATTA 
TAAATCATGA 
ATTAAGG CAT 
TGACATAATT 



21 
I 

ACGCAGCTTC 
TTGCAGCAAT 
CAGCCAGCTA 
GCAAAAGACA 
CAGGCTGCTA 
GATGTTGTTT 
GCACAGTCAC 
CATCAGTGGA 
TCAGACTTAG 
CCTTTTTAGC 
TTGAATCAGC 
GTAATACATT 
TATGTCTCCA 



31 
I 

AGGACGCTGT 
GTGGT CCTCC 
ACCCTACAGA 
TTGATGTTTT 
GCTTGTATAA 
ATCGAGGAGA 
AGCTGAAGAC 
TACCATGTGG 
ATACAAGCCT 
TATTTTTAAT 
TTTAAAGCAT 
AATGAACATA 
TTTTGTTGTA 



41 
I 

GAATTCGCTT 
TGCCTCTTTC 
AGAGTATGCC 
GATAGATTCC 
GCTAGAAGAA 
CATGCTTCTG 
AAGAAGTGGT 
CTGAGAAAAG 
TACCAACAAT 
AGTCTTCTAT 
CAT ACCAT CA 
ATATAAGGAA 
TTGGCCAGTA 



51 
1 

GCAGATCAGT 60 

AATAATATTC 120 

CAGCTTTTTG 180 

TTACCCAGTG 240 

GAAAACCATG 300 

GAGAAGATAC 3 60 

ACCCATAGCC 420 

AACTGTTTGA 480 

TACAGAAACA 540 

TTTCACTCTT 600 

TTTTTTAACT 660 

ACATATGTAA 720 

CTTTTACAAT 7 80 



45 



Seq ID NO: 371 Protein sequence 
Protein Accession NP 004255 



1 ll 21 31 41 51 

en I I I I I I 

D(J madrltqlqd avnsladqfc naigvlqqcg ppasfnniqt ainkdqpanp teeyaqlfaa 

LIARTAKDID VLIDSLPSEE STAALQAASD YKLEEENHEA ATCVEDWYR GDMLLEKIQS 
ALADIAQSQL KTRSGTHSQS LPDS 



60 
120 



Seq ID NO: 372 DNA sequence 
55 Nucleic Acid Accession #: AJ271091 
Coding sequence: 1-1113 



60 



65 



70 



75 



ii 



ATGGAGAATC 
CTGCGCGTGG 
CATTTCAAAG 
TTCTTAGACC 
ACAGTACAGA 
CTGTTTTTGG 
AGAGCTAAGG 
ACTCTTACAA 
TTCTCCTGGA 
TATGACACAT 
GAAACTATCA 
CTTCTTGGAA 
AAAGCTGTGG 
TTCTACATGC 
CTGTGGATTC 
ATTCCAATAT 
AAAGTTAGAT 
ATAAATTTTC 
CATGCCTGTG 



AGGTGTTGAC 
AGCTGAGTGA 
CTCAAGGACA 
TTGTGAAACC 
AGAAAGTGAG 
CTCCTGACTT 
AAGAAGAGCG 
ACTTAAGGAA 
TCTTTGTCAA 
TCCATACTGT 
ATGCAGCAAT 
GAAAT TTTAT 
TTTTCTTTGT 
TGACGTGCAT 
CCTTATATCC 
TCAATGAGAC 
TTTCCTTTTT 
GTCACCTTTA 
ATCCCAGCGC 



21 
I 

GCCGCATGTC 
CGTACAGAAC 
TGGTGCCAAA 
AGAGCCTGTT 
TCAGTGGTGG 
TGATCGTTGG 
CCTAAATAAA 
AGGATACCTG 
CCTGACTGTG 
GGCTGACATG 
TGGAGTCACT 
TTTGTTTATC 
GTTTTATTTG 
TGACATGGAT 
ACTGGGATGT 
CGGACG ATT C 
TCTTCAGATT 
TAAACAG CGC 
TTTGGGAGGC 



31 
I 

TACTGGGCTC 
CCTGCCATCA 
GGAGACAATG 
TACAAACTGA 
GAGAGACTCA 
CTGGATGAAT 
CTCCGACTGG 
TTTATGTATA 
CGATTCTGTA 
ATGTATTTCT 
ACGTCACCGG 
ATCTTTGGCA 
TGGAGTGCAA 
TGGAAGGTGC 
TTGGCGGAAG 
AGTTTCACAT 
TATCTTATAA 
AGACTGAAAA 
TGA 



41 
I 

AGCGACACCG 
G CAT C ACTG A 
TCTATGAATT 
CCCAGAGGCA 
CAAAGCAGGA 
CTGATGCGGA 
AAAGCGAAGG 
ATCTTGTGCA 
TCTTGGGAAA 
GCCAGATGCT 
TGCTGCCTTC 
CCATGGAAGA 
TTGAAATTTT 
TCACATGGCT 
CTGTCTCAGT 
TGCCATATCC 
TGATATTTTT 
TGAGGGCAGG 



51 
I 

CGAGCTATAT 60 

AAACGTGCTG 120 

TCACCTGGAG 180 

GGTAAACATT 240 

AAAGCGACCA 30 0 

AATGGAGCTC 360 

CTCTCCTGAA 42 0 

ATTCTTGGGA 480 

AGAGTCCTTT 540 

GGCAGTTGTG 600 

TCTGATCCAG 660 

AATGCAGAAC 72 0 

CAGGTACTCT 780 

TCGTTACACT 840 

GATTCAGTCC 900 

AGTGAAAATC 960 

AGGTTTATAC 102 0 

CGCAGTGGCT 108 0 



80 



Seq ID NO: 3 73 Protein sequence 
Protein Accession #: CAB69070 



1 11 21 31 41 51 

or I I I I 1 I 

OJ MENQVLTPHV YWAQRHRELY LRVELSDVQN PAISITENVL HFKAQGHGAK GDNVYEFHLE 60 

FLDLVKPEPV YKLTQRQVNI TVQKKVSQWW ERLTKQEKRP LFDAPDFDRW LDESDAEMEL 120 
RAKEEERLNK LRLESEGSPE TLTNLRKGYL FMYNLVQFLG FSWIFVNLTV RFCILGKESF 180 



325 



WO 02/086443 

YDTFHTVADM MYFCQMLAW ETINAAIGVT 
KAWFFVFYL WSAIEIFRYS FYMLTCIDMD 
IPIFNETGRF SFTLPYPVKI KVRFSFFLQI 
HACDPSALGG 



TSPVliPSLIQ LLGRNFILFI IFGTMEEMQN 
WKVLTWLRYT LWIPLYPLGC LAEAVSVIQS 
YLIMIFLGLY INFRHLYKQR RLKMRAGAVA 



Seq ID NO: 374 DNA sequence 
Nucleic Acid Accession NM_016395 
Coding sequence: 1-1113 

1 11 21 31 41 51 

I I I I I I 

ATGGAGAATC AGGTGTTGAC GCCGCATGTC TACTGGGCTC AG CG AC ACCG CGAGCTATAT 

CTGCGCGTGG AG CTGAGTGA CGTACAGAAC CCTGCCATCA GCATCACTGA AAACGTGCTG 

CATTTCAAAG CTCAAGGACA TGGTGCCAAA GGAGACAATG TCTATGAATT TCACCTGGAG 

TTCTTAGACC TTGTGAAACC AGAGCCTGTT TACAAAC T G A CCCAGAGGCA GGTAAACATT 

ACAGTACAGA AGAAAGTGAG TCAGTGGTGG GAGAGACTCA CAAAGCAGGA AAAGCGACCA 

CTGTTTTTGG CTCCTGACTT TGATCGTTGG CTGGATGAAT CTGATGCGGA AATGGAGCTC 

AGAGCTAAGG AAGAAGAG CG CCTAAATAAA CTCCGACTGG AAAGCGAAGG CTCTCCTGAA 

ACTCTTACAA ACTTAAGGAA AGGATACCTG T T TATGTAT A ATCTTGTGCA ATTCTTGGGA 

TTCTCCTGGA TCTTTGTCAA CCTGACTGTG CGATTCTGTA TCTTGGGAAA AGAGTCCTTT 

TATGACACAT TCCATACTGT GGCTGACATG ATGTATTTCT GCCAGATGCT GGCAGTTGTG 

GAAACTATCA ATGCAGCAAT TGGAGTCACT ACGT CACCGG TGCTGCCTTC TCTGATCCAG 

CTTCTTGGAA GAAATTTTAT TTTGTTTATC ATCTTTGGCA CCATGGAAGA AATGCAGAAC 

AAAGCTGTGG TTTTCTTTGT GTTTTATTTG TGGAGTGCAA TTGAAATTTT CAGGTACTCT 

TTCTACATGC TGACGTGCAT TGACATGGAT TGGAAGGTGC TCACATGGCT TCGTTACACT 

CTGTGGATTC CCTTATATCC ACTGGGATGT TTGGCGGAAG CTGTCTCAGT GATTCAGTCC 

ATTCCAATAT TCAATGAGAC CGGACGATTC AGTTTCACAT TGCCATATCC AGTGAAAATC 

AAAGT T AGAT TTTCCTTTTT TCTTCAGATT TATCTTATAA TGATATTTTT AGGTTTATAC 

ATAAATTTTC GTCACCTTTA TAAACAGCGC AGACTGAAAA TGAGGGCAGG CGCAGTGGCT 

CATGCCTGTG ATCCCAGCGC TTTGGGAGGC TGA 



Seq ID NO: 375 Protein sequence 
Protein Accession #: NP_057479 



11 



MENQVLTPHV 
FLDLVKPEPV 
RAKEEERLNK 
YDTFHTVADM 
KAWFFVFYL 
IPIFNETGRF 
STKKKDLDGF 



YVJAQRHRELY 
YKLTQRQVNI 
LRLESEGSPE 
MYFCQMLAW 
WSAIEIFRYS 
SFTLPYPVKI 
LPV 



21 



31 



LRVEL SDVQN 
TVQKKVSQWW 
TLTNLRKGYL 
ETINAAIGVT 
FYMLTCIDMD 
KVRFSFFLQI 



PAISITENVL 
ERLTKQEKRP 
FMYNLVQFLG 
TSPVLPSLIQ 
WKVLTWLRYT 
YLIMIFLGLY 



41 
I 

HFKAQGHGAK 
LFLAPDFDRW 
FSWIFVNLTV 
LLGRNFILFI 
LWIPLYPLGC 
INFRHLYKQR 



51 
I 

GDNVYEFHLE 
LDESDAEMEL 
RFCILGKESF 
IFGTMEEMQN 
LVEAVSVIQS 
RRRYGKKRKR 



Seq ID NO: 3 76 DNA sequence 
Nucleic Acid Accession #: NM_005987 
Coding sequence: 1-270 



ATGAATTCTC 
GTGAAACAAC 
TGCCAACCCA 
ATTCCAGAGC 
CCAGCCCAGC 



11 

I 

AGCAGCAGAA 
CTTGCCAGCC 
AGGTGCCTGA 
CCTGCCAGCC 
AGAAGACCAA 



21 31 41 51 

I I I I 

GCAGCCTTGC ACCCCACCCC CTCAGCCTCA GCAGCAGCAG 

TCCACCCCAG GAACCATGCA TCCCCAAAAC CAAGGAGCCC 

GCCCTGCCAC CCCAAAGTGC CTGAGCCCTG CCAGCCCAAG 

CAAGGTGCCT GAGCCCTGCC CTTCAACGGT CACTCCAGCA 
GCAGAAGTAA 



Seq ID NO: 3 77 Protein sequence 
Protein Accession #: NP_005978 

1 11 21 31 41 51 

I l I I I I 

MNSQQQKQPC TPPPQPQQQQ VKQPCQPPPQ EPCIPKTKEP CQPKVPEPCH PKVPEPCQPK 
IPEPCQPKVP EPCPSTVTPA PAQQKTKQK 



Seq ID NO: 378 DNA sequence 
Nucleic Acid Accession #: NM_002105 
Coding sequence: 74-505 

1 11 21 31 41 51 

I I l l l I 

ACAGCAGTTA CACTGCGGCG GGCGTCTGTT CTAGTGTTTG AGCCGTCGTG CTTCACCGGT 
CTACCTCGCT AGCATGTCGG GCCGCGGCAA GACTGGCGGC AAGGCCCGCG CCAAGGCCAA 
GTCGCGCT CG TCGCGCGCCG GCCTCCAGTT CCCAGTGGGC CGTGTACACC GGCTGCTGCG 
GAAGGGCCAC TACGCCGAGC GCGTTGGCGC CGGCGCGCCA GTGTACCTGG CGGCAGTGCT 
GGAGTACCTC ACCGCTGAGA TCCTGGAGCT GGCGGGCAAT GCGGCCCGCG ACAACAAGAA 
GACGCGAATC ATCCCCCGCC ACCTGCAGCT GGCCATCCGC AACGACGAGG AGCTCAACAA 
GCTGCTGGGC GGCGTGACGA TCGCCCAGGG AGGCGTCCTG CCCAACATCC AGGCCGTGCT 
GCTGCCCAAG AAGACCAGCG CCACCGTGGG GCCGAAGGCG CCCTCGGGCG GCAAGAAGGC 
CACCCAGGCC TCCCAGGAGT ACTAAGAGGG CCCGCGCCGC GGCCGGCCGC CCCAGCTCCC 
CATGCCACCA CAAAGGCCCT TTTAAGGGCC ACCACCGCCC TCATGGAAAG AGCTGAGCCG 
CTTCAGACTG CGGGGCAAGC GGGCCGCGGC TCCCTTCCCC TCCCCTCCCC TCGCCCGCCT 
TCGCCGCCCG GCCTCGAGTC CCCGCCCGCC CCCGCTCCCG TCCCGCACCG CCTGCCGCGT 
CGGCCTCGGG CCTGCCCTGT CCGCCGTCCG CCCTCCGGTA GGGTTCGGGC CTTCCGGATG 
CGGCTTGGGC GCTCTTCGGG GACCTCCGTG GCGCGGAAGA CCCGAGCCTG CCGGGGGGAG 



326 



WO 02/086443 

GCCGGCGGCG CCGCACCTGC CCGCCTCGGC GTTCGTGACT CAGCCGCCCC ATCCCGAGTC 
GCTAAGGGGC TGCGGGGAGG CCGCAGCACC TTCTGGAAGA CTTGGCCTTC CGCTCTGACG 
CAGGGCCGAG GTGGGCAGTC CAGGCCGAGA GCCGGCGGCC CTGAAGGTGA GTGAGGCCCT 
CGGCAGCTGC AGCCGGGGTG TCTGGTACCC CCCCGGCGTG GTGCTTAGCC CAGGACTTTC 
AGACGGCCGC TGGCCGGGAG GCTTTGGTGG GAGAGACGCG ATCG CCGATT TCGGTCTGGC 
GCCCCTTCTG CGGCCGGGAC CCAGGCCTTT CACATCAGCT CTCCCTCCAT CTTCATTCAT 
AGGTCTGCGC TGGGGCCGGG ACGAAGCACT TGGTAACAGG CACATCTTCC TCCCGAGTGA 
CTGCCTCCTA GGAGGACATT TAGGGGAGGG CAGAGGCCTG CAGTTTGGCT TCACGGCTGG 
CTATGTGGAC AGCAAGAGTC GTTTTGCGGA ACGCGACTGG CAGCCAGGCC TGTCGGGCCC 
CCGACGCCGC CCCATTTCCC TTCCAGCAAA CTCAACTCGG CAATCCAAGC ACCTAGATAC 
CAGCACAAGT CGGTTAATCC CTGTCTGGAC TGAGCCTCCG TTGGCTTCTG AACTGGAATT 
CTGCAGCTAA CCCTTCCACG ACTAGAACCT TAGGCATTGG GGAGTTTTAG ATGGACTAAT 
TTTATTAAAG GATTGTTTTT TTTTT 

Seq ID NO: 379 Protein sequence 
Protein Accession #: NP_002096 

1 ll 21 31 41 51 

l I l I 1 I 

MSGRGKTGGK ARAKAKSRSS RAGLQPPVGR VHRLLRKGHY AERVGAGAPV YLAAVLEYLT 
AEILELAGNA ARDNKKTRI I PRHLQLAIRN DEELNKLLGG VTIAQGGVLP NIQAVLLPKK 
TSATVGPKAP SGGKKATQAS QEY 



Seq ID NO: 3 80 DNA sequence 
Nucleic Acid Accession #: AL136942 
Coding sequence : 184-864 

1 11 21 31 41 51 

I I 1 I I I 

ACGCGTCCGG CAGAAGCTCG GAGCTCTCGG GGTATCGAGG AGGCAGGCCC GCGGGCGCAC 
GGGCGAGCGG GCCGGGAGCC GGAGCGGCGG AGGAGCCGGC AGCAGCGGCG CGGCGGGCTC 
CAGGCGAGGC GGTCGACGCT CCTGAAAACT TGCGCGCGCG CTCGCGCCAC TGCGCCCGGA 
GCGATGAAGA TGGTCGCGCC CTGGACGCGG TTCTACTCCA ACAGCTGCTG CTTGTGCTGC 
CATGTCCGCA CCGGCACCAT CCTGCTCGGC GTCTGGTATC TGATCATCAA TGCTGTGGTA 
CTGTTGATTT TATTGAGTGC CCTGGCTGAT CCGGATCAGT ATAACTTTTC AAGTTCTGAA 
CTGGGAGGTG ACTTTGAGTT CATGGATGAT GCCAACATGT GCATTGCCAT TGCGATTTCT 
CTTCTCATGA TCCTGATATG TGCTATGGCT ACTTACGGAG CGTACAAGCA ACGCGCAGCC 
TGGATCATCC CATTCTTCTG TTACCAGATC TTTGACTTTG CCCTGAACAT GTTGGTTGCA 
ATCACTGTGC TTATTTATCC AAACTCCATT CAGGAATACA TACGGCAACT GCCTCCTAAT 
TTTCCCTACA GAGATGATGT CATGT CAGTG AATCCTACCT GTTTGGTCCT TATTATTCTT 
CTGTTTATTA GCATTATCTT GACTTT TAAG GGTTACTTGA TTAGCTGTGT TTGGAACTGC 
TACCGATACA TCAATGGTAG GAACTCCTCT GATGTCCTGG TTTATGTTAC CAGCAATGAC 
ACTACGGTGC TGCTACCCCC GTATGATGAT GCCACTGTGA ATGGTGCTGC C AAGGAG CCA 
CCGCCACCTT ACGTGTCTGC CTAAGCCTTC AAGTGGGCGG AGCTGAGGGC AGCAGCTTGA 
CTTTGCAGAC ATCTGAGCAA TAGTTCTGTT ATTTCACTTT TGCCATGAGC CTCTCTGAGC 
TTGTTTGTTG CTGAAATGCT ACTTTTTAAA ATTTAGATGT TAGATTGAAA ACTGTAGTTT 
TCAACATATG CTTTGCTAGA ACACTGTGAT AGATTAACTG TAGAAT TCTT CCTGTACGAT 
TGGGGATATA ACGGGCTTCA CTAACCTTCC CTAGGCATTG AAACTTCCCC CAAATCTGAT 
GGACCTAGAA GTCTGCTTTT GTACCTGCTG GGCCCCAAAG TTGGGCATTT TTCTCTCTGT 
TCCCTCTCTT TTGAAAATGT AAAATAAAAC CAAAAATAGA CAACTTTTTC TTCAGCCATT 
CCAGCATAGA GAACAAAACC TTATGGAAAC AGGAATGTCA ATTGTGTAAT CATTGTTCTA 
ATTAGGTAAA TAGAAGTCCT TATGTATGTG TTACAAGAAT TTCCCCCACA ACATCCTTTA 
TGACTGAAGT TCAATGACAG TTTGTGTTTG GTGGTAAAGG ATTTTCTCCA TGGCCTGAAT 
TAAGACCATT AGAAAGCACC AGGCCGTGGG AGCAGTGACC ATCTACTGAC TGTTCTTGTG 
GATCTTGTGT CCAGGGACAT GGGGTGACAT GCCTCGTATG TGT TAG AGGG TGGAATGGAT 
GTGTTTGGCG CTGCATGGGA TCTGGTGCCC CTCTTCTCCT GGATTCACAT CCCCACCCAG 
GGCCCGCTTT TACTAAGTGT TCTGCCCTAG ATTGGTT CAA GGAGGT CATC CAACTGACTT 
TATCAAGTGG AATTGGGATA TATTTGATAT ACTTCTGCCT AACAACATGG AAAAGGGTTT 
TCTTTTCCCT GCAAGCTACA TCCTACTGCT TTGAACTTCC AAGTATGTCT AGTCACCTTT 
TAAAATGTAA ACATT TTC AG AAAAATGAGG ATTGCCTTCC TTGTATGCGC TTTTTACCTT 
GACTACCTGA ATTGCAAGGG ATTTTTATAT ATT CATATGT TACAAAGTCA GCAACTCTCC 
TGTTGGTTCA TTATTGAATG TGCTGTAAAT TAAGTCGTTT GCAATTAAAA CAAGGTTTGC 
CCACATCCAA AAAAAAAAAA AAAAA 

Seq ID NO: 381 Protein sequence 
Protein Accession #: CAB66876 

1 11 21 31 41 51 

l l I l l l 

MKMVAPWTRF YSNSCCLCCH VRTGTILLGV WYLIINAWL I* ILL SALAD P DQYNFSSSEL 
GGDFEFMDDA NMCIAIAISL LMILICAMAT YGAYKQRAAW IIPFFCYQIF DFALNMLVAI 
TVLIYPNSIQ EYIRQLPPNF PYRDDVMSVN PTCLVLIILL FISIILTFKG YLISCVWNCY 
RYINGRNSSD VLVYVT SNDT TVLLPPYDDA TVNGAAKEPP PPYVSA 

Seq ID NO: 382 DNA sequence 
Nucleic Acid Accession #: NM_Q02510 
Coding sequence: 92-1774 

1 11 21 31 41 51 

I l l l I I 

CAGATGCCAG AAGAACACTG TTGCTCTTGG TGGACGGGCC CAGAGGAATT CAGAGTTAAA 
CCTTGAGTGC CTGCGTCCGT GAGAATTCAG CATGGAATGT CTCTACTATT TCCTGGGATT 
TCTGCTCCTG GCTGCAAGAT TGCCACTTGA TGCCGCCAAA CGATTTCATG ATGTGCTGGG 
CAATGAAAGA CCTTCTGCTT ACATGAGGGA G C AC AAT CAA TTAAATGGCT GGTCTTCTGA 
TGAAAATGAC TGGAATGAAA AACTCTACCC AGTGTGGAAG CGGGGAGACA TGAGGTGGAA 
AAACTCCTGG AAGGGAGGCC GTGTGCAGGC GGTCCTGACC AGTGACT CAC CAGCCCTCGT 



327 



10 



15 



20 



25 



30 



35 



40 



WO 02/086443 

GGGCTCAAAT ATAACATTTG 
CAATGGCAAC ATAGTCTATG 
ATATGTTTAC AACTGGACAG 
AAG CCAT CAT AACGTCTTCC 
ATGGAATTTC ATCTACGTCT 
TTCAGTGAGA GTTTCTGTGA 
GACTGTCTAC AGAAGACATG 
CGTGGTAACA GATCAGATTC 
ATCCGACGAA ACCTTCCTCA 
TAGCCACTTC CTCAATTATT 
CCTGTTTGTT TCCACCAATC 
CCTTAACCTC ACTGTGAAAG 
CAGACCTTCA AAACCCACCC 
TAGGATTCCT GATGAAAACT 
AATTGTAGAG GG AATCTTAG 
GCCATGGCCT GAAAGCTCCC 
GGAGGTCTGT ACCATCATTT 
CCCTGTGGAT GTGGATGAGA 
GACGTACTGT GTGAACCTCA 
GATTTCTGTT CCTGACAGAG 
CTCCGTTGGC TGCTTGGCCA 
CAAGGAATAC AACCCAATAG 
TGTCTTTCTC AACCGTGCAA 
ACTCAAAAAC CAAGAATTTA 
TTTTCAGTGC CATTGATGTG 
TTATTGTTAA ATAGATATTG 
TTTAGAGATG GGGAGAGGGA 
AAAGCAACTT AGCAAGGCTT 
TAACTAGTAG GATAGAAACA 
AGCCTAACCC AGGTTAACTG 
ATGCATAAAG CCAATGTAGT 
TTCAATACAC ACTCATGAAC 
GTGCACACTT GCTAGACTCA 
TGACAACCTA CTTTGCTTGG 
GGACATTTAG TTAGTGCTTT 
ATTTCCAAAT TTTTGTATAG 
AGATGAGGTC CCTGGTTTTT 
ACTAAAACCA TCTACTATAT 
AAGTGTGGGA AGAGACAAAA 



PCT/US02/12476 



CGGTGAACCT 
AGAAGAACTG 
CATGGTCAGA 
CTGATGGGAA 
TCCACACACT 
ACACAGCCAA 
GACGGGCATA 
CTGTGTTTGT 
AAGATCTCCC 
CTACCATTAA 
ATACTGTGAA 
CTGCAGCACC 
CTTCTTTAGG 
GCCAGATTAA 
AGGTTAACAT 
TAATAGACTT 
CTGACCCCAC 
TGTGTCTGCT 
CCCTGGGGGA 
ACCCAGCCTC 
TATTTGTCAC 
AAAATAGTCC 
AAGCCGTGTT 
AAGGAGTTTC 
AGATGTGCTG 
TGGTTTGGGG 
TTATACTGCA 
CTTTTCATTA 
CTGTGTCCCG 
CAAGAAGAGG 
CCAGTTTCTA 
TCCTGATGGA 
GAAAAAATAC 
CTGAGTGAAG 
TTATATACCA 
TCGCTGCACA 
CATGGCAACT 
GTTAGACATG 
AAAAAAAAA 



GATATTCCCT 
CAGAAATGAG 
GGACAGTGAC 
ACCTTTTCCT 
TGGTCAGTAT 
TGTGACACTT 
TGTTCCCATC 
GACTATGTTC 
CATTATGTTT 
CTACAAGTGG 
T CACACGT AT 
AGGACCTTGT 
ACCTGCTGGT 
CAGATATGGG 
CATCCAGATG 
TGTCGTGACC 
CTGCGAGATC 
GACTGTGAGA 
TGACACAAGC 
GCCTTTAAGG 
TGTGATCTCC 
TGGGAATGTG 
CTTCCCGGGA 
TTAAATTTCG 
GAGTGGCTAT 
AAGTTGAATT 
GGCAGCTTCA 
TTTTTTATGT 
AGAGTAAGGA 
CGGGATACTT 
AGATCATGTT 
ACAATAACAG 
TACTCTCATA 
GAATGATATT 
GGCATGATGC 
TATTTGAAAT 
TGATCAGTAA 
ACATTCTTTT 



AGATGCCAAA 
GCTGGTTTAT 
GGGGAAAATG 
CACCACCCCG 
TTCCAGAAAT 
GGGCCTCAAC 
GCACAAGTGA 
CAGAAGAACG 
GATGTCCTGA 
AGCTTCGGGG 
GTGCTCAATG 
CCGCCACCGC 
GACAACCCCC 
CACTTTCAAG 
ACAGACGTCC 
TGCCAAGGGA 
ACCCAGAACA 
CGAACCTTCA 
CTGGCTCTCA 
ATGGCAAACA 
CTCTTGGTGT 
GTCAGAAGCA 
AACCAGGAAA 
ACCTTGTTTC 
TAACCTTTTT 
TTTTATAGGT 
GCCATGTTGT 
TTCACTTATA 
GAGAAGCTAC 
TCAGCTTTCC 
CCAAGCTAAC 
GCCCAAGCCT 
AATGGGTGGG 
CATATATTCA 
TGAGTGACAC 
CATATATTAA 
GGATTTCACC 
TCTCTCCTTC 



AGGAAGATGC 42 0 

CTGCTGATCC 480 

GCACCGGCCA 540 

GATGGAGAAG 600 

TGGGACGATG 660 

TCATGGAAGT 72 0 

AAGATGTGTA 780 

ATCGAAATTC 840 

TTCATGATCC 90 0 

ATAATACTGG 960 

GAACCTTCAG 102 0 

CACCACCACC 10 80 

TGGAGCTGAG 1140 

CCACCATCAC 12 00 

TGATGCCGGT 12 60 

GCATTCCCAC 132 0 

CAGTCTGCAG 13 8 0 

ATGGGTCTGG 1440 

CGAGCACCCT 150 0 

GTGCCCTGAT 1560 

ACAAAAAAC A 162 0 

AAGGCCTGAG 168 0 

AGGATCCGCT 1740 

TGAAGCTCAC 18 0 0 

TTCCTAAAGA 1860 

TAAATGT CAT 192 0 

GAAACTG ATA 198 0 

AAGTCTTAGG 2 04 0 

TATTGATTAG 2100 

ATGTAACTGT 2160 

TGAATCCCAC 222 0 

GTGGTATGAT 22 80 

AGTATTTTGG 2 34 0 

TTTATTCCAT 2 40 0 

TCTTGTGTAT 24 60 

GACTTTCCAA 2520 

TCTGTTTGTA 2580 

CTGAAAAATA 2 640 



Seq ID NO: 383 Protein sequence 
Protein Accession #: NP 002501 



45 



50 



55 



MECLYYFLGF 
VWKRGDMRWK 
RNEAGLSADP 
GQYFQKLGRC 
TMFQKNDRNS 
HTYVIiNGTFS 
RYGHFQATIT 
CEITQNTVCS 
PLRMANSAL I 
FPGNQEKDPL 



11 

I 

LLLAARLPLD 
NSWKGGRVQA 
YVYNWTAWSE 
SVRVSVNTAN 
SDETFLKDLP 
LNLTVKAAAP 
IVEGILEVNI 
PVDVDEMCLIj 
SVGCLAIFVT 
LKNQEFKGVS 



21 
I 

AAKRFHDVLG 
VLTSDSPALV 
DSDGENGTGQ 
VTLGPQLMEV 
IMFDVLIHDP 
GPCPPPPPPP 
IQMTDVLMPV 
TVRRTFNGSG 
VISLIiVYKKH 



31 

i 

NERPSAYMRE 
GSNITFAVNLt 
SHHNVFPDGK 
TVYRRHGRAY 
SHFLNYSTIN 
RPSKPTPSLG 
PWPESSLIDF 
TYCVNLTLGD 
KEYNPIENSP 



41 

I 

HNQLNGWSSD 
IFPRCQKEDA 
PFPHHPGWRR 
VPIAQVKDVY 
YKWSFGDNTG 
PAGDNPLELS 
WTCQGSIPT 
DTSLALTSTL 
GNWRSKGLS 



51 



ENDWNEKLYP 60 

NGNIVYEKNC 12 0 

WNFIYVFHTL 180 

WTDQIPVFV 240 

LFVSTNHTVN 3 00 

RIPDENCQIN 360 

EVCTIISDPT 42 0 

ISVPDRDPAS 480 

VFLNRAKAVF 540 



60 



Seq ID NO: 3 84 DNA sequence 
Nucleic Acid Accession #: NM_001134 
Coding sequence: 48-1877 



65 



70 



75 



80 



85 



TCCATATTGT 
AATCAATTTT 
AATATGGAAT 
ACCTGGCTAC 
AAATGGTGAA 
GGTGTTTAGA 
TGGAGAAGTA 
TTCTTGCACA 
TCACAAGCTG 
AGATAGCAAG 
ATGACAAAAT 
AGGCAGCAAC 
CAGTAATGAA 
AGAAGTTTAC 
TACATGAGCA 
TGTCCTACAT 
TGACCACGCT 
GTCTATCTCC 
GGGAAAAAAA 
TTGCTGTCTC 
TCCAGACTGA 
TCCAGGAGAG 
ATTACTTACA 
CGGAGCTGAT 
GTGAGGACAA 



11 
I 

GCTTCCACCA 
TTTAATTTTC 
AGCTTCCATA 
CATATTTTTT 
AGATGCATTG 
AAACCAG CTA 
CGGACATTCA 
CAAAAAGCCC 
TGAAGCATAT 
AAGGCATCCC 
AATTCCATCT 
AGTTACAAAA 
AAATTTTGGG 
CAAAGTTAAT 
CTGTTGCAGA 
ATGTTCTCAA 
GGAACGTGGT 
AAATCTAAAC 
TATCTTCTTG 
AGTAATTCTA 
AAACCCTCTT 
CCAAGCATTG 
AAATGCGTTT 
GGCCATCACC 
ACTATTGGCC 



21 
1 

CTGCCAATAA 
CTACTAAATT 
TTGGATTCTT 
GCCCAGTTTG 
ACTGCAATTG 
CCTGCCTTTC 
GACTGCTGCA 
ACTCCAGCAT 
GAAGAAGACA 
TTCCTGTATG 
TGCTGCAAAG 
GAATTAAGAG 
ACCCGAACTT 
TTTACTGAAA 
GGAGATGTGC 
CAAGACACTC 
CAATGTATAA 
AGGTTTTTAG 
GCAAGTTTTG 
AGAGTTGCTA 
GAATGCCAAG 
GCAAAGCGAA 
CTCGTTGCTT 
AGAAAAATGG 
TGTGGCGAGG 



31 
1 

CAAAATAACT 
TTACTGAATC 
ACCAATGTAC 
TT CAAGAAGC 
AGAAACCCAC 
TGGAAGAACT 
GCCAAAGTGA 
CGATCCCACT 
GGGAGACATT 
CACCTACAAT 
CTGAAAATGC 
AAAGCAGCTT 
TCCAAGCCAT 
TCCAGAAACT 
TGGATTGTCT 
TGTCAAACAA 
TTCATGCAGA 
GAGATAGAGA 
TT CATGAATA 
AAGGATACCA 
ATAAAGGAGA 
GCTGCGGCCT 
ACACAAAGAA 
CAGCCACAGC 
GAGCGGCTGA 



41 
I 

AG CAAC CATG 
CAGAACACTG 
TG CAG AG AT A 
CACTTACAAG 
TGGAGATGAA 
TTGCCATGAG 
AGAGGGAAGA 
TTTCCAAGTT 
CATGAACAAA 
TCTTCTTTGG 
AGTTGAATGC 
GTTAAATCAA 
AACTGTTACT 
AGTCCTGGAT 
GCAGGATGGG 
AATAACAGAA 
AAATGATGAA 
TTTTAACCAA 
TTCAAGAAGA 
GGAGTTATTG 
AGAAGAATTA 
CTTCCAGAAA 
AGCCCCCCAG 
AGCCACTTGT 
CATTATTATC 



51 
I 

AAGTGGGTGG 60 

CATAGAAATG 120 

AGTTTAGCTG 180 

GAAGTAAGCA 240 

CAGTCTTCAG 3 00 

AAAGAAATTT 3 60 

CATAACTGTT 420 

CCAGAACCTG 480 

TTCATTTATG 540 

GCTGCTCGCT 600 

TTCCAAACAA 660 

CATGCATGTG 720 

AAACTGAGTC 780 

GTGGCCCATG 840 

GAAAAAATCA 90 0 

TGCTGCAAAC 960 

AAACCTGAAG 1020 

TTTTCTTCAG 1080 

CATCCTCAGC 1140 

GAGAAGTGTT 12 00 

CAGAAATACA 12 60 

CTAGGAGAAT 1320 

CTGACCTCGT 13 80 

TGCCAACTCA 1440 

GGACACTTAT 1500 



328 



10 



WO 02/086443 

GTATCAGACA TGAAATGACT 
ATGCCAACAG GAGGCCATGC 
CATTCTCTGA TGACAAGTTC 
TGCAAACGAT GAAGCAAGAG 
AGGAACAACT TGAGGCTGTC 
GCCAGGAACA GGAAGTCTGC 
CTGCTTTGGG AGTTTAAATT 
TGTGAACTTT TCTCTTTAAT 
AAAGACTTTT ATGTGAGATT 
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CCAGTAAACC 
TTCAGCAGCT 
ATTTTCCATA 
TTTCTCATTA 
ATTGCAGATT 
TTTGCTGAAG 
ACTTCAGGGG 
TTTAACTGAT 
TCCTTATCAC 



CTGGTGTTGG 
TGGTGGTGGA 
AGGATCTGTG 
ACCTTGTGAA 
TCTCAGGCCT 
AGGGACAAAA 
AAGAGAAGAC 
TTAACACTTT 
AGAAATAAAA 



CCAGTGCTGC 
TGAAACATAT 
CCAAGCTCAG 
GCAAAAGCCA 
GTTGGAGAAA 
ACTGATTTCA 
AAAACGAGTC 
TTGTGAATTA 
TATCTCCAAA 



ACrrCTTCAT 1560 

GTCCCTCCTG 1620 

GGTGTAGCGC 1680 

CAAAT AACAG 1740 

TGCTGCCAAG 1800 

AAAACT CGTG 1860 

TTTCATTCGG 1920 

ATGAAATGAT 1980 
TG 



Seq ID NO: 385 Protein sequence 
Protein Accession #: NP 001125 



15 



20 



25 



MKWVESIFLI 
KEVS KMVKD A 
RHNCFLAHKK 
WAARYDKIIP 
TKLSQKFTKV 
ECCKLTTLER 
RHPQLAVSVI 
KLGEYYLQNA 
IGHLCIRHEM 
QGVALQTMKQ 
SKTRAALGV 



11 
I 

FLLNFTESRT 

LTAIEKPTGD' 

PTPASIPLFQ 

SCCKAENAVE 

NFTEIQKLVL 

GQCIIHAEND 

LRVAKGYQEL 

FLVAYTKKAP 

TPVNPGVGQC 

EFLINLVKQK 



21 



LHRNEYGIAS 
EQSSGCLENQ 
VPEPVTSCEA 
CFQTKAATVT 
DVAHVHEHCC 
EKPEGLSPNL 
LEKCFQTENP 
QLTSSELMAI 
CTSSYANRRP 
PQITEEQL.EA 



31 
I 

ILDSYQCTAE 
LPAFLEELCH 
YEEDRETFMN 
KELRESSLLN 
RGDVLDCLQD 
NRFLGDRDFN 
LECQDKGEEE 
TRKMAATAAT 
CFSSLWDET 
VIADFSGLLE 



41 
I 

ISLADLATIF 
EKEILEKYGH 
KFIYEIARRH 
QHACAVMKNF 
GEKIMSYICS 
QFSSGEKNIF 
LQKYIQESQA 
CCQLSEDKLL 
YVPPAFSDDK 
KCCQGQEQEV 



51 
I 

FAQFVQEATY 60 

SDCCSQSEEG 120 

PFLtYAPTILiIi 180 

GTRTFQAITV 240 

QQDTLSNKIT 3 00 

LASFVHEYSR 3 60 

LAKRSCGLFQ 420 

ACGEGAAD I I 480 

FIFHKDLCQA 540 

CFAEEGQKLI 600 



30 



Seq ID NO: 386 DNA sequence 

Nucleic Acid Accession #: NM_ 002205.1 

Coding sequence: 1..3149 



11 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



ATGGGGAGCC 
CGCCGACCCC 
GGCTTCAACT 
GGATTCTCAG 
CCCAAGGCTA 
TGGGGTGCCA 
CTGGAGTCCT 
TGGTTCGGGG 
AGCTGGCGCA 
GATAACTTCA 
GGACAGGGTT 
TTAGGTGGAC 
ATTGCAGAAT 
CGCCAGGCCA 
TTCAGTGGTG 
GGCTATGTCA 
CAGATGGCCT 
GATGACTTGC 
GAGGTGGGCA 
CTTACCCTCA 
GACCTGGACC 
CAGCAGGGAG 
CAGGTTCTGC 
CGAGGAGGCC 
GTGGACAAGG 
ATCTTCCCCG 
GCCTGCATCA 
GGTTTCACAG 
CTGTTCCTGG 
CGAGAGGATT 
CTCTCGCCGA 
CACGGCCTCA 
ATCTTGCTGG 
GGGGAGCAGA 
CAGAATGTGG 
GCTGAGTACT 
TTTGCCGTGA 
GCCAGTCTGT 
ATCCAGTTTG 
TCCTTTCGGC 
GAGGCAGTGC 
GACCTGGGAC 
AGCCAGGGTG 
GTGACCAGAG 
GAGTTGGATC 
TCTGCTTCCT 
TGTGAGCTCG 
TGGG CCAAGA 
TACAAAGCCC 
CAGGTGGCCA 
AT CAT CATCC 
TACAAGCTTG 
CTCAAGCCTC 



GGACGCCAGA 
CGCTSSTGCC 
TAGACGCGGA 
TGGAGTTTTA 
ATACC AG CCA 
GCCCCACACA 
CACTGTCCAG 
CAACAGTTCG 
CAGAGAAGGA 
CCCGAATTCT 
ACTGCCAAGG 
CAGGAAGCTA 
CTTATTACCC 
GTTCCATCTA 
ATGACACAGA 
CCATCCTTAA 
CCTACTTTGG 
TGGTGGGGGC 
GGGTCTACGT 
CTGGCCATGA 
AGGATGGCTA 
TAGTGTTTGT 
AGCCCCTGTG 
GAGACCTGGA 
CTGTGGTATA 
CCATGTTCAA 
ACCTTAGCTT 
TGGAACTTCA 
CCTCCAGGCA 
GCAGAGAGAT 
TTCACATCGC 
GGCCAGCCCT 
ACTGTGGAGA 
ACCATGTGTA 
GTGAGGGTGG 
CAGGACTCGT 
ACCAGAGCCG 
GGGGTGGCCT 
ACTTCCAGAT 
TCTCCGTGGA 
TATTCCCAGT 
CTGCTGTCCA 
TGCTGGAACT 
TTACGGGACT 
CCGAGGGTTC 
CGGGACCTCA 
GGCCCCTGCA 
CTTTCTTGCA 
TGAAGATGCC 
CAGCTGTGCA 
TAGCCAT CCT 
GATTCTTCAA 
CAGCCACCTC 



21 
I 

GTCCCCTCTC 
GCTGCTGTTG 
GGCCCCAGCA 
CCGGCCGGGA 
GCCAGGAGTG 
GTGCACCCCC 
CTCAGAGGGA 
AGCCCATGGC 
GCCACTGAGC 
GGAGTATGCA 
AGGCTTCAGT 
TTTCTGGCAA 
CGAGTACCTG 
TGATGACAGC 
AGACTTTGTT 
TGGCTCAGAC 
CTATGCAGTG 
ACCCCTGCTC 
CTACCTGCAG 
TGAGTTTGGC 
CAATGATGTG 
ATTTCCTGGG 
GGCAGCCAGC 
TGGCAATGGA 
CAGGGGCCGC 
CCCAGAGGAG 
CTGCCTCAAT 
GCTGGACTGG 
GGCAACCCTG 
GAAGATCTAC 
TCTCAACTTC 
ACATTATCAG 
AGACAACATC 
CCTGGGTGAC 
CGCCTATGAG 
CAGACACCCA 
CCTGCTGGTG 
TCGGTTTACA 
CCTCAGCAAG 
GGCTCAGGCC 
AAGCGACTGG 
CCATGTCTAT 
CAGCTGTCCC 
CAACTGCACC 
CCTGCACCAC 
GAT CCTGAAA 
CCAACAAGAG 
GCGGGAGCAC 
CTACCGAATC 
ATGGACCAAG 
GTTTGGCCTC 
ACGCTCCCTC 
TGATGCCTGA 



31 

I 

CACGCCGTGC 
CTGCTSSTGC 
GTACTCTCGG 
ACAGACGGGG 
CTGCAGGGTG 
ATTGAATTTG 
GAGGAGCCTG 
TCCTCCATCT 
GACCCCGTGG 
CCCTGCCGCT 
GCCGAGTTCA 
GGCCAGATCC 
ATCAACCTGG 
TACCTAGGAT 
GCTGGTGTGC 
ATTCGATCCC 
GCCGCCACAG 
ATGGATCGGA 
CACCCAGCCG 
CGATTTGGCA 
GCCAT CGGGG 
GGCCCAGGAG 
CACACCCCAG 
TATCCTGATC 
CCCATCGTGT 
CGGAGCTGCA 
GCTTCTGGAA 
CAGAAGCAGA 
ACCCAGACCC 
CTCAGGAACG 
TCCTTGGACC 
AGCAAGAGCC 
TGTGTGCCTG 
AAGAATGCCC 
GCTGAGCTTC 
GGGAACTTCT 
TGTGACCTGG 
GTCCCTCATC 
AATCTCAACA 
CAGGTCACCC 
CATCCCCGAG 
GAG CTCATCA 
CAGGCTCTGG 
ACCAATCACC 
CAGCAAAAAC 
TGCCCGGAGG 
AGCCAAAGTC 
CAGCCATTTA 
CTGCCTCGGC 
GCAGAAGGCA 
CTGCTCCTAG 
CCATATGGCA 



41 

I 

AGCTGCGCTG 
CGCCGCCACC 
GGCCCCCGGG 
TCAGTGTGCT 
GTGCTGTCTA 
ACAGCAAAGG 
TGGAGTACAA 
TGGCATGCGC 
GCACCTGCTA 
CAGATTTCAG 
CCAAGACTGG 
TGTCTGCCAC 
TTCAGGGGCA 
ACTCTGTGGC 
CCAAAGGGAA 
TCTACAACTT 
ACGTCAATGG 
CCCCTGACGG 
GCATAGAGCC 
GCTCCTTGAC 
CTCCCTTTGG 
GGCTGGGCTC 
ACTTCTTTGG 
TGATTGTGGG 
CCGCTAGTGC 
GCTTAGAGGG 
AACACGTTGC 
AGGGAGGGGT 
TGCTCATCCA 
AGTCAGAATT 
CCCAAGCCCC 
GGATAGAGGA 
ACCTGCAGCT 
TGAACCTCAC 
GGGTCACCGC 
CCAGCCTGAG 
GCAACCCCAT 
TCCGGGACAC 
ACTCGCAAAG 
TGAACGGTGT 
ACCAGCCTCA 
ACCAAGGCCC 
AAGGTCAGCA 
CCATTAACCC 
GGGAAGCTCC 
CTGAGTGTTT 
TGCAGTTGCA 
GCCTGCAGTG 
AGCTGCCCCA 
GCTATGGCGT 
GTCTACTCAT 
CCGCCATGGA 



51 

I 

GGGCCCCCGG 60 

CAGGGTCGGG 120 

CTCCTTCTTC 180 

GGTGGGAGCA 240 

CCTCTGTCCT 300 

CTCTCGGCTC 3 60 

GTCCTTGCAG 420 

TCCACTGTAC 480 

CCTCTCCACA 540 

CTGGGCAGCA 600 

CCGTGTGGTT 660 

TCAGGAGCAG 72 0 

GCTGCAGACT 780 

TGTTGGTGAA 840 

CCTCACTTAC 900 

CTCAGGGGAA 960 

GGACGGGCTG 1020 

GCGGCCTCAG 1080 

CACGCCCACC 1140 

CCCCCTGGGG 1200 

TGGGGAGACC 12 60 

TAAGCCTTCC 132 0 

CTCTGCCCTT 13 80 

GTCCTTTGGT 1440 

CTCCCTCACC 1500 

GAACCCTGTG 1560 

TGACTCCATT 162 0 

ACGGCGGGCA 1680 

GAATGGGGCT 1740 

TCGAGACAAA 1800 

AGTGGACAGC 1860 

CAAGGCTCAG 192 0 

GGAAGTGTTT 1980 

TTTCCATGCC 2040 

CCCTCCAGAG 2100 

CTGTGACTAC 2160 

GAAGGCAGGA 2220 

TAAGAAAACC 22 80 

CGACGTGGTT 2 340 

CTCCAAGCCT 2400 

GAAGGAGGAG 2460 

CAGCTCCATT 2520 

GCTCCTATAT 2580 

AAAGGGCCTG 2 640 

AAGCCGCAGC 2700 

CAGGCTGCGC 2760 

TTTCCGAGTC 2820 

TGAGGCTGTG 2880 

AAAAGAGCGT 2 940 

CCCACTGTGG 3000 

CTACATCCTC 3 060 

AAAAGCTCAG 312 0 



329 



WO 02/086443 



Seq ID NO: 387 Protein sequence 
Protein Accession #: NP_002 196.1 

1 11 21 31 41 51 

I i I I 1 1 

MGSRTPESPL HAVQLRWGPR RRPPLLPLLL LLLPPPPRVG GFNLDAEAPA VLSGPPGSFF 

GFSVEFYRPG TDGVSVLVGA PKANTSQPGV LQGGAVYLCP WGASPTQCTP IEFDSKGSRL 

LESSLSSSEG EEPVEYKSLQ WFGATVRAHG SSILACAPLY SWRTEKEPLS DPVGTCYLST 

DNFTR I LEY A PCRSDFSWAA GQGYCQGGFS AEFTKTGRW LGGPGSYFWQ GQIIiSATQEQ 

IAESYYPEYL 'INLVQGQLQT RQASSIYDDS YLGYSVAVGE FSGDDTEDFV AGVPKGNLTY 

GYVTILNGSD IRSLYNFSGE QMASYFGYAV AATDVNGDGL DDLLVGAPLL MDRTPDGRPQ 

EVGRVYVYLQ HPAGIEPTPT LTLTGHDEFG RFGSSLTPLG DLDQDGYNDV AIGAPFGGET 

QQGWFVFPG GPGGLGSKPS QVLQPLWAAS HTPDFFGSAL RGGRDLDGNG YPDLIVGSFG 

VDKAWYRGR PIVSASASLT IFPAMFNPEE RSCSLEGNPV ACINLSFCLN ASGKHVAD S I 

GFTVELQLDW QKQKGGVRRA LFLASRQATL TQTLLIQNGA REDCREMKIY LRNES EFRDK 

LSPIHIALNF SLDPQAPVDS HGLRPALHYQ SKSRIEDKAQ ILLDCGEDNI CVPDLQLEVF 

GEQNHVYLGD KNALNLTFHA QNVGEGGAYE AELRVTAPPE AEYSGLVRHP GNFSSLSCDY 

FAVNQSRLLV CDLGNPMKAG ASLWGGLRFT VPHLRDTKKT IQFDFQILSK NLNNSQSDW 

SFRLSVEAQA QVTLNGVSKP EAVLFPVSDW HPRDQPQKEE DLGPAVHHVY ELINQGPSSI 

SQGVLELSCP QALEGQQLLY VTRVTGLNCT TNHPINPKGL ELD PEGS LHH QQKREAPSRS 

SASSGPQILK CPEAECFRLR CELGPLHQQE SQSLQLHFRV WAKTFLQREH QPFSLQCEAV 

YKALKMP YR I LPRQLPQKER QVATAVQWTK AEGSYGVPLW IIILAILFGL LLLGLLIYIL 

YKLGFFKRSL PYGTAMEKAQ LKPPATSDA 

Seq* ID NO: 388 DNA sequence 

Nucleic Acid Accession #: NM_002425 

Coding sequence: 26.. 1453 

1 11 21 31 41 51 

l I I l I I 

AAAGAAGGTA AGGGCAGTGA GAATGATGCA TCTTGCATTC CTTGTGCTGT TGTGTCTGCC 
AGTCTGCTCT GCCTATCCTC TGAGTGGGGC AGCAAAAGAG GAGGACTCCA ACAAGGATCT 
TGCCCAGCAA TACCTAGAAA AGTACTACAA CCTCGAAAAG GATGTGAAAC AGTT TAGAAG 
AAAGGACAGT AATCTCATTG TTAAAAAAAT CCAAGGAATG CAGAAGTTCC TTGGGTTGGA 
GGTGACAGGG AAGCTAGACA CTGACACTCT GGAGGTGATG CGCAAGCCCA GGTGTGGAGT 
TCCTGACGTT GGTCACTTCA GCTCCTTTCC TGGCATGCCG AAGTGGAGGA AAACCCACCT 
TACATACAGG ATTGTGAATT ATACACCAGA TTTGCCAAGA GATGCTGTTG ATTCTGCCAT 
TGAGAAAGCT CTGAAAGTCT GGGAAGAGGT GACTCCACTC ACATTCTCCA GGCTGTATGA 
AGGAGAGGCT GATATAATGA TCTCTTTCGC AGTTAAAGAA CATGGAGACT TTTACTCTTT 
TGATGGCCCA GGACACAGTT TGGCTCATGC CTACCCACCT GGACCTGGGC TTTATGGAGA 
TATTCACTTT GATGATGATG AAAAAT GG AC AGAAGATGCA TCAGGCACCA ATTTATTCCT 
CGTTGCTGCT CATGAACTTG GCCACTCCCT GGGGCTCTTT CACTCAGCCA ACACTGAAGC 
TTTGATGTAC CCACTCTACA ACTCATTCAC AGAGCTCGCC CAGTTCCGCC TTTCGCAAGA 
TGATGTGAAT GGCATTCAGT CTCTCTACGG ACCTCCCCCT GCCTCTACTG AGGAACCCCT 
GGTGCCCACA AAATCTGTTC CTTCGGGATC TGAGATGCCA GCCAAGTGTG ATCCTGCTTT 
GTCCTTCGAT GCCATCAGCA CTCTGAGGGG AGAATATCTG TTCTTTAAAG ACAGATATTT 
TTGGCGAAGA TCCCACTGGA ACCCTGAACC TGAATTTCAT TTGATTTCTG CATTTTGGCC 
CTCTCTTCCA TCATATTTGG ATGCTGCATA TGAAGTTAAC AGCAGGGACA CCGTTTTTAT 
TTTTAAAGGA AATGAGT TCT GGGCCATCAG AGGAAATGAG GTACAAGCAG GTTATCCAAG 
AGGCATCCAT ACCCTGGGTT TTCCTCCAAC CATAAGGAAA ATTGATGCAG CTGTTTCTGA 
CAAGGAAAAG AAGAAAACAT ACTTCTTTGC AGCGGACAAA TACTGGAGAT TTGATGAAAA 
TAGCCAGTCC ATGGAGCAAG GCTTCCCTAG ACTAATAGCT GATGACTTTC CAGGAGTTGA 
GCCTAAGGTT GATGCTGTAT TACAGGCATT TGGATTTTTC TACTTCTTCA GTGGATCATC 
ACAGTTTGAG TTTGACCCCA ATGCCAGGAT GGTGACACAC ATATTAAAGA GTAACAGCTG 
GTTACATTGC TAGG CGAGAT AGGGGGAAGA CAGATATGGG TGTTTTTAAT AAATCTAATA 
ATTATTCATC TAATGTATTA TGAGCCAAAA TGGTTAATTT TTCCTGCATG TTCTGTGACT 
GAAGAAGATG AGCCTTGCAG ATATCTGCAT GTGTCATGAA GAATGTTTCT GGAATTCTTC 
ACTTGCTTTT GAATTGCACT GAACAGAATT AAGAAATACT CATGTGCAAT AGGTGAGAGA 
ATGTATTTTC ATAGATGTGT TATTACTTCC TCAATAAAAA GTTTTATTTT GGGCCTGTTC 
CTT 

Seq ID NO: 389 Protein sequence 
Protein Accession #: NP_002416 

1 11 21 31 41 51 

I I I I I i 

MHLAFLVLLC LPVCSAYPLS GAAKEED SNK DLAQQYLEKY YNLEKDVKQF RRKDSNLIVK 

KIQGMQKFLG LEVTGKLDTD TLEVMRKPRC GVPDVGHFSS FPGMPKWRKT HLTYRIVNYT 

PDLPRDAVDS AIEKALKVWE EVTPLTFSRL YEGEADIMIS FAVKEHGDFY SFDGPGHSLA 

HAYPPGPGLY GDIHFDDDEK WTEDASGTNL FLVAAHELGH SLGLFHSANT EALMYPLYNS 

FTELAQFRLS QDDVNGIQSL YGPPPASTEE PLVPTKSVPS GSEMPAKCDP ALSFDAISTL 

RGEYLFFKDR YFWRRSHWNP EPEFHLISAF WPSLPSYLDA AYEVNSRDTV F I FKGNEFWA 

IRGNEVQAGY PRGIHTLGFP PT I RKIDAAV SDKEKKKTYF FAADKYWRFD ENSQSMEQGF 

PRLIADDFPG VEPKVDAVLQ AFGFFYFFSG SSQFEFDPNA RMVTHILKSN SWLHC 

Seq ID NO: 390 DNA sequence 

Nucleic Acid Accession #: NM_002421.2 

Coding sequence: 1..140 9 

1 11 21 31 41 51 

l I l I I l 

ATGCACAGCT TTCCTCCACT GCTGCTGCTG CTGTTCTGGG GTGTGGTGTC ACACAGCTTC 

CCAGCGACTC TAGAAACACA AGAGCAAGAT GTGGACTTAG TCCAGAAATA CCTGGAAAAA 

TACTACAACC TGAAGAATGA TGGGAGGCAA GTTGAAAAGC GGAGAAATAG TGGCCCAGTG 

GTTGAAAAAT TGAAGCAAAT GCAGGAATTC TTTGGGCTGA AAGTGACTGG GAAACCAGAT 

GCTGAAACCC TGAAGGTGAT GAAGCAGCCC AGATGTGGAG TGCCTGATGT GGCTCAGTTT 



330 



10 



15 



20 



WO 02/086443 

GTCCTCACTG AGGGGAACCC 
TACACGCCAG ATTTGCCAAG 
TGGAGTAATG TCACACCTCT 
ATATCTTTTG TCAGGGGAGA 
CTTGCTCATG CTTTTCAACC 
GAAAGGTGGA CCAACAATTT 
GGCCATTCTC TTGGACTCTC 
ACCTTCAGTG GTGATGTTCA 
GGACGTTCCC AAAATCCTGT 
AAGCTAACCT TTGATGCTAT 
TTCTACATGC GCACAAATCC 
TGGCCACAAC TGCCAAATGG 
CGGTTTTTCA AAGGGAATAA 
CCCAAGGACA TCTACAGCTC 
CTTTCTGAGG AAAACACTGG 
GATGAATATA AACGATCTAT 
GGAATTGGCC ACAAAGTTGA 
GGAACAAGAC AATACAAATT 
AATAGCTGGT TCAACTGCAG 



PCT/US02/12476 



TCGCTGGGAG 
AGCAGATGTG 
GACATTCACC 
T CATCGGG AC 
AGGCCCAGGT 
CAGAGAGTAC 
CCATT CTACT 
GCTAGCTCAG 
CCAGCCCATC 
AACTACGATT 
CTTCTACCCG 
GCTTGAAGCT 
GTACTGGGCT 
CTTTGGCTTC 
AAAAACCTAC 
GGATCCAGGT 
TGCAGTTTTC 
TGATCCTAAA 
GAAAAATTAG 



CAAACAC AT C 
GACCATGCCA 
AAGGTCTCTG 
AACT CTCCTT 
ATTGGAGGGG 
AACTTACATC 
GATATCGGGG 
GATGACATTG 
GGCCCACAAA 
CGGGGAGAAG 
GAAGTTGAGC 
GCTTACGAAT 
GTTCAGGGAC 
CCTAGAACTG 
TTCTTTGTTG 
TAT CCCAAAA 
ATGAAAGATG 
ACGAAGAGAA 



TGACCTACAG 
TTGAGAAAGC 
AGGGTCAAGC 
TTGATGGACC 
ATGCTCATTT 
GTGTTGCGGC 
CTTTGATGTA 
ATGGCATCCA 
CCCCAAAAGC 
TGATGTTCTT 
TCAATTTCAT 
TTGCCGACAG 
AGAATGTGCT 
T G AAG CAT AT 
CTAACAAATA 
TGATAGCACA 
GATTTTTCTA 
TTTTGACTCT 



GATTGAAAAT 360 

CTTCCAACTC 42 0 

AGACAT CATG 480 

TGGAGGAAAT 540 

TGATGAAGAT 600 

TCATGAACTC 660 

CCCTAGCTAC 72 0 

AGCCATATAT 780 

ATGTGACAGT 840 

TAAAGACAGA 900 

TTCTGTTTTC 960 

AGATGAAGTC 102 0 

ACACGGATAC 1080 

CGATGCTGCT 1140 

CTGGAGGTAT 12 00 

TGACTTTCCT 12 60 

TTTCTTTCAT 132 0 

CCAGAAAGCT 13 80 



Seq ID NO: 3 91 Protein sequence 
Protein Accession #: NP 002412.1 



25 



30 



35 



I 

MHSFPPLLLL 
VEKLKQMQEF 
YTPDLPRADV 
LAHAFQPGPG 
TFSGDVQLAQ 
FYMRTNPFYP 
PKDIYSSFGF 
GIGHKVDAVF 



11 



LFWGWSHSF 
FGLKVTGKPD 
DHAI EKAFQL 
IGGDAHFDED 
DDIDGIQAIY 
EVELNFISVF 
PRTVKH I DAA 
MKDGFFYFFH 



21 
I 

PATLETQEQD 
AETLKVMKQP 
WSNVTPLTFT 
ERWTNNFREY 
GRSQNPVQPI 
WPQLPNGLEA 
LSEENTGKTY 
GTRQYKFDPK 



31 

I 

VDLVQKYLEK 
RCGVPDVAQF 
KVSEGQADIM 
NLHRVAAHEL 
GPQTPKACDS 
AYEFADRDEV 
FFVANKYWRY 
TKRILTLQKA 



41 



YYNLKNDGRQ 
VLTEGNPRWE 
ISFVRGDHRD 
GHSLGLSHST 
KLTFDAITTI 
RFFKGNKYWA 
DEYKRSMDPG 
NSWFNCRKN 



51 
I 

VEKRRNSGPV 60 

QTHLTYRIEN 12 0 

NSPFDGPGGN 180 

DIGALMYPSY 240 

RGEVMFFKDR 3 00 

VQGQNVLHGY 3 60 

YPKMIAHDFP 420 



Seq ID NO: 3 92 DNA sequence 

Nucleic Acid Accession #: NM_0 02421.2 

Coding sequence: 1..1409 



40 



45 



50 



55 



60 



65 



ATGCACAGCT 
CCAGCGACTC 
TACTACAACC 
GTTGAAAAAT 
GCTGAAACCC 
GTCCTCACTG 
TACACGCCAG 
TGGAGTAATG 
ATATCTTTTG 
CTTGCTCATG 
GAAAGGTGGA 
GGCCATTCTC 
ACCTTCAGTG 
GGACGTTCCC 
AAGCTAACCT 
TTCTACATGC 
TGGCCACAAC 
CGGTTTTTCA 
CCCAAGGACA 
CTTTCTGAGG 
GATGAATATA 
GGAATTGGCC 
GGAACAAGAC 
AATAGCTGGT 



11 

I 

TTCCTCCACT 
TAGAAACACA 
TGAAGAATGA 
TGAAGCAAAT 
TGAAGGTGAT 
AGGGGAACCC 
ATTTGCCAAG 
TCACACCTCT 
TCAGGGGAGA 
CTTTTCAACC 
CCAACAATTT 
TTGGACTCTC 
GTGATGTTCA 
AAAATCCTGT 
TTGATGCTAT 
GCACAAATCC 
TGCCAAATGG 
AAGGGAATAA 
TCTACAGCTC 
AAAACACTGG 
AACGATCTAT 
ACAAAGTTGA 
AATACAAATT 
TCAACTGCAG 



21 
1 

GCTGCTGCTG 
AGAGCAAGAT 
TGGGAGGCAA 
GCAGGAATTC 
GAAGCAGCCC 
TCGCTGGGAG 
AGCAGATGTG 
GACATTCACC 
T CAT CGGGAC 
AGGCCCAGGT 
CAGAGAGTAC 
CCATT CTACT 
GCTAGCTCAG 
CCAGCCCATC 
AACTACGATT 
CTTCTACCCG 
GCTTGAAGCT 
GTACTGGGCT 
CTTTGGCTTC 
AAAAACCTAC 
GGATCCAGGT 
TGCAGTTTTC 
TGATCCTAAA 
GAAAAATTAG 



31 



CTGTTCTGGG 
GTGGACTTAG 
GTTGAAAAGC 
TTTGGGCTGA 
AGATGTGGAG 
CAAACAC AT C 
GACCATGCCA 
AAGGTCTCTG 
AACTCTCCTT 
ATTGGAGGGG 
AACTTACATC 
GATATCGGGG 
GATGACATTG 
GGCCCACAAA 
CGGGGAGAAG 
GAAGTTGAGC 
GCTTACGAAT 
GTTCAGGGAC 
CCTAGAACTG 
TTCTTTGTTG 
TATCCCAAAA 
ATGAAAGATG 
ACGAAGAGAA 



41 

GTGTGGTGT C 
TCCAGAAATA 
GGAGAAATAG 
AAGTGACTGG 
TGCCTGATGT 
TGACCTACAG 
TTGAGAAAGC 
AGGGTCAAGC 
TTGATGGACC 
ATGCTCATTT 
GTGTTGCGGC 
CTTTGATGTA 
ATGGCATCCA 
CCCCAAAAGC 
TGATGTTCTT 
TCAATTTCAT 
TTGCCGACAG 
AGAATGTGCT 
TGAAGCATAT 
CTAACAAATA 
TGATAGCACA 
GATTTTTCTA 
TTTTGACTCT 



51 
I 

ACACAGCTTC 60 

CCTGGAAAAA 12 0 

TGGCCCAGTG 18 0 

GAAACCAGAT 240 

GGCTCAGTTT 300 

GATTGAAAAT 360 

CTTCCAACTC 420 

AGACATCATG 480 

TGGAGGAAAT 540 

TGATGAAGAT 600 

TCATGCCCTC 660 

CCCTAGCTAC 720 

AGCCATATAT 780 

ATGTGACAGT 840 

TAAAGACAGA 900 

TTCTGTTTTC 960 

AGATGAAGTC 1020 

ACACGGATAC 10 8 0 

CGATGCTGCT 1140 

CTGGAGGTAT 120 0 

TGACTTTCCT 1260 

TTTCTTTCAT 132 0 

CCAGAAAGCT 1380 



70 



75 



80 



Seq ID NO: 3 93 Protein sequence 
Protein Accession #: NP 002412.1 



MHSFPPLLLL 
VEKLKQMQEF 
YTPDLPRADV 
LAHAFQPGPG 
TFSGDVQLAQ 
FYMRTNPFYP 
PKDIYSSFGF 
GIGHKVDAVF 



11 

I 

LFWGWSHSF 
FGLKVTGKPD 
DHAIEKAFQL 
IGGDAHFDED 
DDIDGIQAIY 
EVELNFISVF 
PRTVKH IDAA 
MKDGFFYFFH 



21 



PATLETQEQD 
AETLKVMKQP 
WSNVTPLTFT 
ERWTNNFREY 
GRSQNPVQPI 
WPQLPNGLEA 
LSEENTGKTY 
GTRQYKFDPK 



31 



VDLVQKYLEK 
RCGVPDVAQF 
KVSEGQADIM 
NLHRVAAHAL 
GPQTPKACDS 
AYEFADRDEV 
FFVANKYWRY 
TKRILTLQKA 



41 



51 



YYNLKNDGRQ 
VLTEGNPRWE 
ISFVRGDHRD 
GHSLGLSHST 
KLTFDAITTI 
RFFKGNKYWA 
DEYKRSMDPG 
NSWFNCRKN 



VEKRRNSGPV 60 

QTHLTYRIEN 120 

NSPFDGPGGN 180 

DIGALMYPSY 240 

RGEVMFFKDR 300 

VQGQNVLHGY 360 

YPKMIAHDFP 42 0 



85 



Seq ID NO: 3 94 DNA sequence 

Nucleic Acid Accession #: NM__014331.2 

Coding sequence: 1..1506 



1 
I 



11 



21 



31 



41 



51 



331 



WO 02/086443 PCT/US02/12476 

ATGGTCAGAA AGCCTGTTGT GTCCACCATC TCCAAAGGAG GTTACCTGCA GGGAAATGTT 60 

AACGGGAGGC TGCCTTCCCT GGG CAACAAG GAGCCACCTG GGCAGGAGAA AGTGCAGCTG 120 

AAGAGGAAAG TCACTTTACT GAGGGGAGTC TCCATTATCA TTGGCACCAT CATTGGAGCA 180 

GGAATCTTCA TCTCTCCTAA GGGCGTGCTC CAGAACACGG GCAG CGTGGG CATGTCTCTG 240 

5 ACCATCTGGA CGGTGTGTGG GGTCCTGTCA CTATTTGGAG GTTTGTCTTA TGCTGAATTG 300 

GGAACAACTA TAAAGAAATC TGGAGGTCAT TACACATATA TTTTGGAAGT CTTTGGTCCA 360 

TTACCAGCTT TTGTACGAGT CTGGGTGGAA CTCCTCATAA TACGCCCTGC AGCTACTGCT 420 

GTGATATCCC TGGCATTTGG ACGCTACATT CTGGAACCAT TTTTTATTCA ATGTGAAATC 480 

CCTGAACTTG CGATCAAGCT CATTACAGCT GTGGGCATAA CTGTAGTGAT GGTCCTAAAT 540 

10 AGCATGAGTG TCAGCTGGAG CGCCCGGATC CAGATTTTCT TAACCTTTTG CAAGCTCACA 60 0 

GCAATTCTGA TAATTATAGT CCCTGGAGTT ATGCAGCTAA TTAAAGGTCA AACGCAGAAC 660 

TTTAAAGACG CGTTTTCAGG AAGAGATTCA AGTATTACGC GGTTGCCACT GGCTTT TTAT 720 

TATGGAATGT ATGCATATGC TGGCTGGTTT TACCTCAACT TTGTTACTGA AGAAGTAGAA 780 

AACCCTGAAA AAACCATTCC CCTTGCAATA TGTATATCCA TGGCCATTGT CACCATTGGC 84 0 

15 TATGTGCTGA CAAATGTGGC CTACTTTACG ACCATTAATG CTGAGGAGCT GCTGCTTTCA 900 

AATGCAGTGG CAGTGACCTT TTCTGAGCGG CTACTGGGAA ATTTCTCATT AGCAGTTCCG 960 

ATCTTTGTTG CCCTCTCCTG CTTTGGCTCC ATGAACGGTG GTGTGTTTGC TGTCTCCAGG 1020 

TTATTCTATG TTGCGTCTCG AGAGGGTCAC CTT CCAGAAA TCCTCTCCAT GATTCATGTC 1080 

CGCAAGCACA CTCCTCTACC AGCTGTTATT GTTTTGCACC CTTTGACAAT GATAATGCTC 1140 

20 TTCTCTGGAG AC CT CG AC AG TCTTTTGAAT TTCCTCAGTT TTGCCAGGTG GCTTTTTATT 12 00 

GGGCTGGCAG TTGCTGGGCT GATTTATCTT CGATACAAAT GCCCAGATAT GCATCGTCCT 1260 

TTCAAGGTGC CACTGTTCAT CCCAGCTTTG TTTTCCTTCA CATGCCTCTT CATGGTTGCC 1320 

CTTTCCCTCT ATTCGGACCC ATTTAGTACA GGGATTGGCT T CGTCATCAC TCTGACTGGA 1380 

GTCCCTGCGT ATTATCTCTT TAT TATATGG GACAAGAAAC CCAGGTGGTT TAGAATAATG 1440 

25 TCAGAGAAAA TAACCAGAAC ATTACAAATA ATACTGGAAG TTGTACCAGA AGAAGATAAG 1500 

TTATGAACTA ATGGACTTGA GATCTTGGCA ATCTGCCCAA GGGGAGACAC AAAATAGGGA 1560 

TTTTTACTTC ATTTTCTGAA AGTCTAGAGA ATTACAACTT TGGTGATAAA CAAAAGGAGT 162 0 

CAGTTATTTT TATTCATATA TTTTAGCATA TTCGAACTAA TTTCTAAGAA ATTTAGTTAT 1680 

AACTCTATGT AGTTATAGAA AGTGAATATG CAGTTATTCT ATGAGTCGCA CAATTCTTGA 1740 

30 GTCTCTGATA CCTACCTATT GGGGTTAGGA GAAAAGACTA GACAATTACT ATGTGGT CAT 180 0 

TCTCTACAAC ATATGTTAGC ACGGCAAAGA ACCTTCAAAT TGAAGACTGA GATTTTTCTG 1860 

TATATATGGG TTTTGTAAAG ATGGTTTTAC ACACTACAGA TGTCTATACT GTGAAAAGTG 1920 

TTTTCAATTC TGAAAAAAAG CATACATCAT GATTATGGCA AAGAGGAGAG AAAGAAATTT 1980 

ATTTTACATT GACATTGCAT TGCTTCCCCT TAGATACCAA TTTAGATAAC AAACACTCAT 2 040 

35 GCTTTAATGG ATTATACCCA GAGCACTTTG AACAAAGGTC AGTGGGGATT GTTGAATACA 2100 

TTAAAGAAGA GTTTCTAGGG GCTACTGTTT ATGAGACACA TCCAGGAGTT ATGTTTAAGT 2160 

AAAAATCCTT GAGAATTTAT TATGTCAGAT GTTTTTTCAT TCATTAT CAG GAAGTTTTAG 2220 

TTATCTGTCA TTTTTTTTTT TCACATCAGT TTGATCAGGA AAGTGTATAA CACATCTTAG 22 8 0 

AGCAAGAGTT AGTTTGGTAT TAAATCCTCA TTAGAACAAC CACCTGTTTC ACTAATAACT 2340 

40 TACCCCTGAT GAGTCTATCT AAACATATGC ATTTTAAGCC TTCAAATTAC ATTATCAACA 2400 

TGAGAGAAAT AACCAACAAA GAAGATGTTC AAAATAATAG TCCCATATCT GTAATCATAT 2460 

CTACATGCAA TGTTAGTAAT TCTGAAGTTT TTTAAATTTA TGGCTATTTT TACACGATGA 2520 

TGAATTTTGA CAGTTTGTGC ATTTTCTTTA TACATTTTAT ATTCTTCTGT TAAAATATCT 2580 

CTTCAGATGA AACTGTCCAG ATTAATTAGG AAAAGGCATA TATTAACATA AAAATTGCAA 2 640 

45 AAGAAATGTC GCTGTAAATA AGATT TACAA CTGATGTTTC TAGAAAATTT CCACTTCTAT 2700 

AT CTAGGCTT TGTCAGTAAT TTCCACACCT TAATTATCAT TCAACTTGCA AAAGAGACAA 2760 

CTGATAAGAA GAAAATTGAA ATGAGAATCT GTGGATAAGT GTTTGTGTTC AGAAGATGTT 2820 

GTTTTGCCAG TATTAGAAAA TACTGTGAGC CGGGCATGGT GGCTTACATC TGTAATCCCA 2880 

GCACTTTGGG AGGCTGAGGG GGTGGATCAC CTGAGGTCGG GAGTTCTAGA CCAGCCTGAC 2 940 

50 CAACATGGAG AAACCCCATC TCTACTAAAA ATACAAAATT AGCTGGGCAT GGTGGCACAT 3 00 0 

GCTGGTAATC TCAGCTATTG AGGAGGCTGA GGCAGGAGAA TTGCTTGAAC CCGGGAGGCG 3060 

GAGGTTGCAG TGAGCCAAGA TTGCACCACT GTACTCCAGC CTGGGTGACA AAGTCAGACT 3120 

CCATCTCCAA AAAAAAAAAA AAAA 

55 Seq ID NO: 3 95 Protein sequence 
Protein Accession #: NP_055146.1 

1 11 21 31 41 51 

CIS I 1 1 1 1 1 

OU MVRKPWSTI SKGGYLQGNV NGRLPSLGNK EPPGQEKVQL KRKVTLLRGV SIIIGTIIGA 60 

GIFISPKGVL QNTGSVGMSL TIWTVCGVLS LFGALSYAEL GTTIKKSGGH YTYILEVFGP 120 

LPAFVRVWVE LLIIRPAATA VISLAFGRYI LEPFFIQCEI PELAIKLITA VGITWMVLN 180 

SMSVSWSARI QIFLTFCKLT AILIIIVPGV MQLIKGQTQN FKDAFSGRDS SITRLPLAFY 240 

YGMYAYAGWF YLNFVTEEVE NPEKTIPLAI CISMAITIGV YVLTNVAYFT TINAEELLLS 300 

65 NAVAVTFSER LLGNFSLAVP IFVALSCFGS MNGGVFAVSR LFYVASREGH LPEILSMIHV 360 

RKHTPLPAVI VLHPLTMIML FSGDLDSLLN FLSFARWLFI GLAVAGLIYL RYKCPDMHRP 420 

FKVPLFIPAL FSFTCLFMVA LSLYSDPFST GIGFVITLTG VPAYYLFIIW DKKPRWFRIM 480 

SEKITRTLQI ILEWPEEDK L 



70 



Seq ID NO: 396 DNA sequence 

Nucleic Acid Accession #: NM__00652 8 

Coding sequence: 57.. 764 



75 1 11 21 31 41 51 

I I I 



GCCGCCAGCG GCTTTCTCGG ACGCCTTGCC CAGCGGGCCG CCCGACCCCC TGCACCATGG 60 

ACCCCGCTCG CCCCCTGGGG CTGTCGATTC TGCTGCTTTT CCTGACGGAG GCTGCACTGG 120 

GCGATGCTGC TCAGGAGCCA ACAGGAAATA ACGCGGAGAT CTGTCTCCTG CCCCTAGACT 180 

80 ACGGACCCTG CCGGGCCCTA CTTCTCCGTT ACTACTACGA CAGGTACACG CAGAGCTGCC 240 

GCCAGTTCCT GTACGGGGGC TGCGAGGGCA ACGCCAACAA TTTCTACACC TGGGAGGCTT 300 

GCGACGATGC TTGCTGGAGG ATAGAAAAAG TTCCCAAAGT TTGCCGGCTG CAAGTGAGTG 360 

TGGACGACCA GTGTGAGGGG TCCACAGAAA AGTATTTCTT TAATCTAAGT TCCATGACAT 420 

GTGAAAAATT CTTTTCCGGT GGGTGTCACC GGAACCGGAT TGAGAACAGG TTTCCAGATG 480 

85 AAGCTACTTG TATGGGCTTC TGCGCACCAA AGAAAATTCC ATCATTTTGC TACAGTCCAA 540 

AAGATGAGGG ACTGTGCTCT GCCAATGTGA CTCGCTATTA TTTTAATCCA AGATACAGAA 600 

CCTGTGATGC TTTCACCTAT ACTGGCTGTG GAGGGAATGA CAATAACTTT GTTAGCAGGG 660 



332 



10 



15 



20 



25 



30 



35 



40 



45 



50 



60 



65 



70 



75 



80 



85 



WO 02/086443 

AGGATTGCAA ACGTGCATGT 
GCTTTGCCAG TAGAATCCGG 
ATCTTGTTTG TCTTTATGGC 
GCATGAGGAA ACAAATCATT 
TTCAAAAATT TGGATTTTTT 
TTTAATTTAT GGTTCAACTG 
AAATATGACT CACTCATTTC 
AAACAACATA AGACAATATA 
CC 



GCAAAAGCTT 
AAAATTCGGA 
TTATTTGCCT 
GGTGATTTAT 
TATATATAAC 
TTTGTGAGAC 
TTGGGGTCGT 
ATCATGTGCT 



TGAAAAAGAA 
AGAAGCAATT 
TTATGGTTGT 
TCACCAGTTT 
TAGCTGCTAT 
GAATTCTTGC 
ATTCCTGATT 
TTTAACATAT 



AAAGAAGATG 
TTAAACATTC 
ATCTGAAGAA 
TTATTAATAC 
TCAAATGTGA 
AATGCATAAG 
TCAGAAGAGG 
TTGAGAATAA 



CCAAAGCTTC 
TTAATATGTC 
TAATATGACA 
AAGTCACTTT 
GTCTACCATT 
ATATAAAAGC 
ATCATAACTG 
AAAGGACTAG 



Seq ID NO: 3 97 Protein sequence 
Protein Accession #: NP_006519 

1 ll 21 31 41 51 

I I I I I I 

MDPARPLGLS ILLLFLTEAA LGDAAQEPTG NNAEICLLPL DYGPCRALLL RYYYDRYTQS 

CRQFLYGGCE GNANNFYTWE ACDDACWRIE KVPKVCRLQV SVDDQCEGST EKYFFNLSSM 

TCEKFFSGGC HRNR I ENRFP DEATCMGFCA PKKIPSFCYS PKDEGLCSAN VTRYYFNPRY 

RTCDAFTYTG CGGNDNNFVS REDCKRACAK ALKKKKKMPK LRFASRIRKI RKKQF 

Seq ID NO: 398 DNA sequence 

Nucleic Acid Accession #: NM_001508.1 

Coding sequence: 1..1361 



ATGGCTTCAC 
CCCGAGTTTG 
TTCGTGATGG 
AAAGGATACT 
TTGGTGTTCC 
ACGTCCAGCT 
GCTACGCTGC 
TTCAGGTACA 
GTCACCTCCG 
GTGAACGTGC 
CAGCCCGAGA 
CAGTCCAGCA 
ATGTGCTGGA 
ACGCGGCCTC 
ACCATCATCT 
ATT CGGAGG A 
GCGTACATGA 
CCGCTCCTGT 
TGCCGCCTGT 
ACCACCGACA 
T CTGCAAGG A 
TCTAAGTCCC 
AATTCTGCTG 



11 
I 

CCAGCCTCCC 
AGGTGGCCAC 
GCCTTCTGGG 
TGCAGAAGGA 
TCATCGGCAT 
ACACCCTGTC 
TGCACGTGCT 
AGGCTGTGTC 
CCCTGGTGGC 
CCAGCCACCG 
CCTCCAATAT 
TCTTCGGCGC 
ACATGATGCA 
CGCAGCTGAG 
TCCTGAGGCT 
TCATGGCTGC 
TCCTCCTCCC 
AC ACGGTGT C 
CGCTGCAGCA 
GCGCCCGCTT 
GAACTGAGAA 
AGTCATTGAG 
CAGAGAATGG 



21 
I 

GGGCAGTGAC 
CTGGATCAAA 
GAACAGCGTC 
GGTGACAGAC 
GCCCATGGAG 
CTGCAAGCTG 
GACGCTCAGC 
GGGACCTTGC 
ACTGCCCTTG 
GGGTCTCACT 
GTCCATCTGT 
CTTCGTGGTC 
GGTGCTCATG 
GAAGTCCGAG 
GATTGTTGTG 
GGCCAAACCC 
CTTCTCGGAG 
CTCGCAGCAG 
CGCCAACCAC 
TGTGCAGCGC 
GATTTTCTTA 
TCTCGAGTCA 
TTTT CAGGAG 



31 



TGCTCCCAAA 
ATCACCCTTA 
ACCATTCGGG 
CACATGGTGA 
TTCTACAGCA 
CACACTTTCC 
TTTGAGCGCT 
CAGGTGAAGC 
CTGTTTGCCA 
TGCAACCGCT 
ACCAACCTCT 
TACCTCGTGG 
AAAAGCCAGA 
AGCGAAGAGA 
ACATTGGCCG 
AAGCACGACT 
ACGTTTTTCT 
TTTCGGCGGG 
GAGAAGCGCC 
CCGTTGCTCT 
AGCACTTTTC 
CTAGAGCCCA 
CATGAAGTTT 



41 
I 

TCATTGATCA 
TTCTGGTGTA 
TCACCCAGGT 
GTTTGGCTTG 
TCATCTGGAA 
TCTTCGAGGC 
ACATCGCCAT 
TGCTGATTGG 
TGGGTACTGA 
CCAGCACCCG 
CCAGCCGCTG 
TCCTGCTCTC 
AGGGCTCGCT 
GCAGGACCGC 
TATGCTGGAT 
GGACGAGGTC 
ACCTCAGCTC 
TGTTCGTGCA 
TGCGCGTACA 
TCGCGTCCCG 
AGAGCGAGGC 
ACTCAGGCGC 
GA 



51 
I 

CAGTCATGT C 
CCTGATCATC 
GCTGCAGAAG 
CTCGGACATC 
TCCCCTGACC 
CTGCAGCTAC 
CTGTCACCCC 
CTTCGTCTGG 
GTACCCCCTG 
CCACCACGAG 
GACCGTGTTC 
CGTAGCCTTC 
GGCCGGGGGC 
CAGGAGGCAG 
GCCCAACCAG 
CTACTTCCGG 
GGTCATCAAC 
GGTGCTGTGC 
TGCGCACTCC 
GCGCCAGTCC 
CGAGCCCCAG 
GAAACCAGCC 



Seq ID NO: 3 99 Protein sequence 
Protein Accession #: NP 001499.1 



55 i 



MASPSLPGSD 
KGYLQKEVTD 
ATIiLHVLTLS 
VNVPSHRGLT 
MCWNMMQVLM 
IRRIMAAAKP 
CRLSLQHANH 
SKSQSLSLES 



11 
I 

CSQIIDHSHV 
HMVSLACSDI 
FERYIAICHP 
CNRSSTRHHE 
KSQKGSLAGG 
KHDWTRSYFR 
EKRLRVHAHS 
LEPNSGAKPA 



21 
I 

PEFEVATWIK 
LVFLIGMPME 
FRYKAVSGPC 
QPETSNMSIC 
TRPPQLRKSE 
AYMILLPFSE 
TTDSARFVQR 
NSAAENGFQE 



31 

] 

ITLILVYLII 
FYSIIWNPLT 
QVKLLIGFVW 
TNLSSRWTVF 
SEESRTARRQ 
TFFYLSSVIN 
PLLFASRRQS 
HEV 



41 



51 



FVMGbLGNSV 
TSSYTLSCKL 
VTSAbVALPL 
QSSIFGAFW 
TIIFLRLIW 
PLLYTVSSQQ 
SARRTEKIFL 



TIRVTQVLQK 
HTFIiFEACSY 
LFAMGTEYPL 
YLWLLSVAF 
TLAVCWMPNQ 
FRRVFVQVLC 
STFQSEAEPQ 



Seq ID NO: 400 DNA sequence 

Nucleic Acid Accession #: NM_006475.1 

Coding sequence: 28.. 2538 



11 



AACAGAACTG 
TTGCTGCTTA 
AGTCGTATCA 
ACCAAAAAGA 
AAAACGACTG 
TGCCCAGCAG 
ACAACGCAGC 
TTCACTTACT 
GGTTTGGAGA 
AAGAGAATGT 
TTGGGGCTTT 
AT CCATGGGA 
CAAATTGGTA 
GCAGCTGCCA 
TTTGCTCCCA 
GGAGACAAAG 
TCTGAGTCTA 



CAACGGAGAG 
TTGTTAACCC 
GGGGTCGGGA 
AATACTTCAG 
TTTTATATGA 
TTTTGCCCAT 
GCTATTCTGA 
TTGCACCGAG 
GCAACGTGAA 
TGACCAAGGA 
TCATTAACCA 
ACCAGATTGC 
CCT CAATTCA 
TCACATCGGA 
CCAATGAGGC 
TGGCTTCCGA 
TTATGGGAGG 



21 
I 

ACT CAAGATG 
TATAAACGCC 
CCAAGGCCCA 
CACTTGTAAG 
ATGTTGCCCT 
TGACCATGTT 
CGCCT CAAAA 
TAATGAGGCT 
TGTTGAATTA 
CTTAAAAAAT 
TTATCCTAAT 
AACAAATGGT 
AGACTTCATT 
CATATTGGAG 
TTTTGAGAAA 
AGCTCTTATG 
AGCAGTCTTT 



31 

I 

ATTCCCTTTT 
AACAATCATT 
AATGTCTGTG 
AACTGGTATA 
GGTTATATGA 
TATGGCACTC 
CTGAGGGAGG 
TGGGACAACT 
CTGAATGCTT 
GGCATGATTA 
GGGGTTGTCA 
GTTGTCCATG 
GAAGCAGAAG 
GCCCTTGGAA 
CTTCCACGAG 
AAGTACCACA 
GAGACGCTGG 



41 

I ' 

TACCCATGTT 
ATGACAAGAT 
CCCTTCAACA 
AAAAGTCCAT 
GAATGGAAGG 
TGGGCAT CGT 
AGATCGAGGG 
TGGATTCTGA 
TACATAGTCA 
TTCCTTCAAT 
CTGTTAATTG 
TCATTGACCG 
ATGACCTTTC 
GAGACGGTCA 
GTGT CCTAGA 
TCTTAAATAC 
AAGGAAATAC 



51 
I 

TTCTCTACTA 
CTTGGCTCAT 
GATTTTGGGC 
CTGTGGACAG 
AATGAAAGGC 
GGGAGCCACC 
AAAGGGATCC 
TATCCGTAGA 
CATGATTAAT 
GTATAACAAT 
TGCTCGAATC 
TGTGCTTACA 
ATCTTTTAGA 
CTTCACACTC 
AAGGTTCATG 
TCTCCAGTGT 
AATTGAGATA 



720 
780 
840 
900 
960 
1020 
1080 
1140 
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60 
120 
180 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 



60 
120 
180 
240 
300 
360 
420 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
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GGATGTGACG GTGACAGTAT AACAGTAAAT GGAAT CAAAA TGGTGAACAA AAAGGATATT 1080 

GTGACAAATA ATGGTGTGAT CCATTTGATT GATCAGGTCC TAATTCCTGA TTCTGCCAAA 1140 

CAAGTTATTG AGCTGGCTGG AAAACAGCAA ACCACCTTCA CGGATCTTGT GGCCCAATTA 12 00 

GGCTTGGCAT CTGCTCTGAG GCCAGATGGA GAATACACTT TGCTGGCACC TGTGAATAAT 1260 

5 GCATTTTCTG ATGATACTCT CAGCATGGTT CAGCGCCTCC TTAAATTAAT TCTGCAGAAT 132 0 

CACATATTGA AAGTAAAAGT TGGCCTTAAT GAGCTTTACA ACGGGCAAAT ACTGGAAACC 1380 

ATCGGAGGCA AACAGCTCAG AGTCTTCGTA TATCGTACAG CTGTCTGCAT TGAAAATTCA 1440 

TGCATGGAGA AAGGGAGTAA GCAAGGGAGA AACGGTGCGA TTCACATATT CCGCGAGATC 1500 

ATCAAGCCAG CAGAGAAATC CCT CCATGAA AAGTTAAAAC AAGATAAGCG CTTTAGCACC 15 60 

10 TTCCTCAGCC TACTTGAAGC TGCAGACTTG AAAGAGCTCC TGACACAACC TGGAGACTGG 1620 

ACATTATTTG TGCCAACCAA TGATGCTTTT AAGGGAATGA CTAGTGAAGA AAAAGAAATT 1680 

CTGATACGGG ACAAAAATGC TCTTCAAAAC ATCATTCTTT ATCACCTGAC ACCAGGAGTT 1740 

TTCATTGGAA AAGGATTTGA ACCTGGTGTT ACTAACATTT TAAAGACCAC AGAAGGAAGC 1800 

AAAATCTTTC TGAAAGAAGT AAATGATACA CTTCTGGTGA ATGAATTGAA ATCAAAAGAA 1860 

15 TCTGACATCA TGACAACAAA TGGTGTAATT CATGTTGTAG ATAAACTCCT CTAT CCAGCA 1920 

GACACACCTG TTGGAAATGA TCAACTGCTG GAAATACTTA ATAAATTAAT CAAATACATC 1980 

CAAATTAAGT TTGTTCGTGG TAGCACCTTC AAAGAAAT CC CCGTGACTGT CTATACAACT 2 040 

AAAATTATAA CCAAAGTTGT GGAACCAAAA ATTAAAGTGA TTGAAGGCAG TCTTCAGCCT 2100 

ATTAT CAAAA CTGAAGGACC CACACTAACA AAAGT CAAAA TTGAAGGTGA ACCTGAATTC 2160 

20 AGACTGATTA AAGAAGGTGA AACAATAACT GAAGTGATCC ATGGAGAGCC AATTATTAAA 2220 

AAATACACCA AAATCATTGA TGGAGTGCCT GTGGAAATAA CTGAAAAAGA GACACGAGAA 2280 

GAACGAATCA TTACAGGTCC TGAAATAAAA TACACTAGGA TTTCTACTGG AGGTGGAGAA 2340 

ACAGAAGAAA CTCTGAAGAA ATTGTTACAA GAAGAGGTCA CCAAGGTCAC CAAATTCATT 2400 

GAAGGTGGTG ATGGTCATTT ATTTGAAGAT GAAGAAATTA AAAGACTGCT TCAGGGAGAC 2460 

25 ACACCCGTGA GGAAGTTGCA AGCCAACAAA AAAGTTCAAG GTTCTAGAAG ACGATTAAGG 252 0 

GAAGGTCGTT CTCAGTGAAA ATCCAAAAAC CAGAAAAAAA TGTTTATACA ACCCTAAGTC 2580 

AATAACCTGA CCTTAGAAAA TTGTGAGAGC CAAGTTGACT TCAGGAACTG AAACAT CAGC 2 640 

ACAAAGAAGC AATCAT CAAA TAATTCTGAA CACAAATTTA ATATTTTTTT TTCTGAATGA 2 700 

GAAACATGAG GGAAATTGTG GAGTTAGCCT CCTGTGGTAA AGGAATTGAA GAAAATATAA 2 760 

30 CACCTTACAC CCTTTTTCAT CTTGACATTA AAAGTTCTGG CTAACTTTGG AATCCATTAG 2820 

AGAAAAATCC TTGTCACCAG ATTCATTACA ATTCAAATCG AAGAGTTGTG AACTGTTATC 2880 

CCATTGAAAA GACCGAGCCT TGTATGTATG TTATGGATAC ATAAAATGCA CGCAAGCCAT 2 940 

TATCTCTCCA TGGGAAGCTA AGTTATAAAA ATAGGTGCTT GGTGTACAAA ACTTTTTATA 3 00 0 

TCAAAAGGCT TTGCACATTT CTATATGAGT GGGTTTACTG GTAAATTATG TTATTTTTTA 3060 

35 CAACTAATTT TGTACTCTCA GAATGTTTGT CATATGCTTC TTGCAATGCA TATTTTTTAA 312 0 

TCTCAAACGT TTCAATAAAA CCATTTTTCA GATATAAAGA GAATTACTTC AAATTGAGTA 3180 

ATT C AG AAAA ACTCAAGATT TAAGTTAAAA AGTGGTTTGG ACTTGGGAA 

Seq ID NO: 401 Protein sequence 
40 Protein Accession #: NP_00 6466.1 

1 11 21 31 41 51 

l I l l l l 

MIPFLPMFSL LLLLIVNPIN ANNHYDKILA HSRIRGRDQG PNVCALQQIL GTKKKYFSTC 60 

45 KNWYKKSICG QKTTVLYECC PGYMRMEGMK GCPAVLPIDH VYGTLGIVGA TTTQRYSDAS 12 0 

KLREEIEGKG SFTYFAPSNE AWDNLDSDIR RGLE SNVNVE LLNALHSHMI NKRMLTKDLK 180 

NGMIIPSMYN NLGLFINHYP NGWTVNCAR I IHGNQIATN GWHVIDRVL TQIGTSIQDF 240 

IEAEDDLSSF RAAAITSDIL EALGRDGHFT LFAPTNEAFE KLPRGVLERF MGDKVASEAL 300 

MKYHILNTLQ CSESIMGGAV FETLEGNTIE IGCDGDSITV NGIKMVNKKD IVTNNGVIHL 3 60 

50 IDQVLIPDSA KQVIELAGKQ QTTFTDLVAQ LGLASALRPD GEYTLLAPVN NAFSDDTLSM 420 

VQRLLKLILQ NHILKVKVGL NELYNGQILE TIGGKQLRVF VYRTAVCI EN SCMEKGSKQG 480 

RNGAIHIFRE IIKPAEKSLH EKLKQDKRFS TFLSLLEAAD LKELLTQPGD WTLFVPTNDA 540 

FKGMTSEEKE ILIRDKNALQ NIILYHLTPG VFIGKGFEPG VTNILKTTQG SKI FLKEVND 60 0 

TLLVNELKSK ESDIMTTNGV IHWDKLLYP ADTPVGNDQL LEILNKLIKY IQIKFVRGST 660 

55 FKEIPVTVYT TKIITKWEP KIKVIEGSLQ PIIKTEGPTL TKVKIEGEPE FRLIKEGETI 72 0 

TEVIHGEPII KKYTKI IDGV PVEITEKETR EERIITGPEI KYTRISTGGG ETEETLKKXiL 780 

QEEVTKVTKF IEGGDGHLFE DEEIKRLLQG DTPVRKLQAN KKVQGSRRRL REGRSQ 

Seq ID NO: 402 DNA sequence 
60 Nucleic Acid Accession NM_002416 
Coding sequence: 40.. 417 

1 11 21 31 41 51 

I I I I I ! 

05 ATCCAATACA GGAGTGACTT GGAACTCCAT TCTATCACTA TGAAGAAAAG TGGTGTTCTT 60 

TTCCTCTTGG GCATCATCTT GCTGGT TCTG ATTGGAGTGC AAGGAACCCC AGTAGTGAGA 120 

AAGGGTCGCT GTTCCTGCAT CAGCACCAAC CAAGGGACTA TCCACCTACA ATCCTTGAAA 180 

GACCTTAAAC AATTTGCCCC AAGCCCTTCC TGCGAGAAAA T TGAAAT CAT TGCTACACTG 240 

AAGAATGGAG TTCAAACATG TCTAAACCCA GATT CAGCAG ATGTGAAGGA ACTGATTAAA 300 

70 AAGTGGGAGA AACAGGTCAG CCAAAAGAAA AAGCAAAAGA ATGGGAAAAA ACATCAAAAA 3 60 

AAGAAAGTTC TGAAAGTTCG AAAATCTCAA CGTTCTCGTC AAAAGAAGAC TACATAAGAG 42 0 

ACCACTTCAC CAATAAGTAT TCTGTGTTAA AAATGTTCTA TTTTAATTAT ACCGCTATCA 480 

TTCCAAAGGA GGATGGCATA TAATACAAAG GCTTAT TAAT TTGACTAGAA AATTTAAAAC 540 

ATTACT CTGA AATTGTAACT AAAGTTAGAA AGTTGAT TTT AAGAATCCAA ACGTTAAGAA 600 

75 TTGTTAAAGG CTATGATTGT CTTTGTTCTT CTACCACCCA CCAGTTGAAT TTCATCATGC 660 

TTAAGGCCAT GAT T T TAG CA ATACCCATGT CTACACAGAT GTTCACCCAA CCACATCCCA 720 

CTCACAACAG CTGCCTGGAA GAGCAGCCCT AGGCTTCCAC GTACTGCAGC CTCCAGAGAG 780 

TATCTGAGGC ACATGTCAGC AAGTCCTAAG CCTGTTAGCA TGCTGGTGAG CCAAGCAGTT 840 

TGAAATTGAG CTGGACCTCA CCAAGCTGCT GTGG CCATCA ACCTCTGTAT TTGAATCAGC 900 

80 CTACAGGCCT CACACACAAT GTGTCTGAGA GATT CATGCT GATTGTTATT GGGTAT CACC 960 

ACTGGAGATC ACCAGTGTGT GGCTTTCAGA GCCTCCTTTC TGGCTTTGGA AGCCATGTGA 1020 

TTCCATCTTG CCCGCTCAGG CTGACCACTT TATTTCTTTT TGTTCCCCTT TGCTTCATTC 1080 

AAGTCAGCTC TTCTCCATCC TACCACAATG CAGTGCCTTT CTTCTCTCCA GTGCACCTGT 1140 

CATATGCTCT GATTTATCTG AGTCAACTCC TTTCTCATCT TGTCCCCAAC ACCCCACAGA 12 00 

85 AGTGCTTTCT TCTCCCAATT CATCCTCACT CAGTCCAGCT TAGTTCAAGT CCTGCCTCTT 12 60 

AAATAAACCT TTTTGGACAC ACAAATTATC TTAAAACTCC TGTTTCACTT GGTTCAGTAC 1320 

CACATGGGTG AACACTCAAT GGTTAACTAA TTCTTGGGTG TTTATCCTAT CTCTCCAACC 1380 
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10 



15 



20 
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AGATTGTCAG CTCCTTGAGG 
CTAATAATAC TGTGGAACTA 
TGGCAACCAG ACCATTGTCT 
CTAGCCTCTG GTAACCTCTT 
GATGCAACAT CCTTGTCTTT 
GCACGTGGTA AAACACTTGC 
AAAAT CAT AT AATCTTACAA 
CCAACCATAC AAAAATTCCT 
TCTAAGATCT AACAAGATAG 
AGTTTTATTG TCCGTTTACT 
TCTCCCATGA AGAAAGGGAA 
TAGTGGAAGC ATGATTGGTG 
GGAGGTTCAG TGAATTGTGT 
CTTTCCCAAA TTGAATCACT 
TCCCACCCGA ACGTCTTATC 
AAAAATCTAA GTGTTTCATA 
GTAGACAGTA TATAACTAAC 
TCATTTATCA TATATATACA 
AAACAGTATT GACTTGTATA 
TATCAATAAA TAGACCATTA 
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GCAAGAGCCA 
GGTTTTAATA 
CAGAGCAGGT 
ACTTATTATC 
TTATGACAGG 
GGATATTCTG 
TGAAAAGGAC 
TTTCCCGAAG 
CCACCGAGAT 
TGTTTCAGAG 
CGGTGAAGTA 
CCCAGTTAGC 
AGGAGAGGTT 
GCTCACACTG 
TAATCATGAA 
AATTTGAGAG 
AACCAAAGAC 
TACATGCATA 
CCTTGTAATT 
ATCAG 



CAGTATATTT 
ATTTTTTAAT 
GCTGGCTCTT 
TTCAGGACAC 
ATGTTTGCTC 
GACTGTTTTT 
TTTATAGATC 
GAAAAGGGCT 
CCTTATCGAA 
TTTGTATTGT 
CTAAGCGCTA 
CT CTGCAGG A 
GTCTGTGGCC 
CTGATGATTT 
ACTCCCTAGT 
TCTGTGACCC 
TACATATTGT 
CACTCTCAAA 
TGAAATATTT 



CCCTGTTTCT 
TGATGTTGTT 
TCCTGGCTAC 
TCACTACAGG 
AGCTTCTCCA 
AAAAAATATA 
AGCCAGTGAC 
TTCTCAATAA 
ACTCATTTTA 
GATTATCAAT 
GAGGAAGCAG 
TGTGGAAACC 
AGAATTTAAA 
AGAGTGCTGT 
TCCTTCATGT 
ACTTACCTTG 
CACTGACACA 
GCAAATAATT 
TCTTTGTTAA 



TCCACAGTGC 1440 

ATGGGCAGGA 1500 

TCCATGTTGG 1560 

GACCAGGGAT 162 0 

ACAATAAGAA 1680 

CAGTTTACCG 1740 

CAACCTTTTC 1800 

GCCTCAGCTT 1860 

GGCAAATATG 1920 

T ACCACACCA 1980 

CCAAGT CGGT 2040 

TCCTTCCAGG 2100 

CCTATACTCA 2160 

CCGGTGGAGA 222 0 

AACTTCCCTG 22 80 

CATCT CACAG 2340 

CACGTTATAA 2400 

TTTCACTTCA 2460 

AATAGAATGG 2520 



25 



30 



35 



40 



45 



50 



55 



60 



65 



Seq ID NO: 403 Protein sequence 
Protein Accession #: NP_002407 

1 11 21 31 41 51 

i I l I l I 

MKKSGVLFLL GI ILLVLIGV QGTPWRKGR CSCISTNQGT IHLQSLKDLK QFAPSPSCEK 
IEIIATLKNG VQTCLNPDSA DVKELIKKWE KQVSQKKKQK NGKKHQKKKV LKVRKSQRSR 
QKKTT 

Seq ID NO: 404 DNA sequence 

Nucleic Acid Accession #: NM_006670 

Coding sequence: 85.. 1347 



70 



CCGGCTCGCG 
AGCTCCGGGG 
GACGGGCGTC 
TCTCCCACCT 
TCCGCCCAGC 
CGCACAGTCA 
GTGCGCAACC 
CGCCGGCCGC 
GTGCGCGCGG 
CCACTGGCCG 
AGTCCCCTTG 
CGGAGCTTCG 
CGCCGCTTGG 
CTGCCCAGCC 
TCCTTCCGCA 
CTTCACAATG 
AACAATCCCT 
GAGGTAGTGC 
GTCCTCTTGG 
CAAACCTCTT 
GTTTTGTATT 
AGGGATCACA 
AACCTCAGTT 
CATGAGATGT 
TAGATACAAC 
TTTCTCGGTG 
TTCTTTTTCT 
TGGGCTTCTT 
ACAGATAGCA 
TAT CAGTTTT 
CTGCAGACGT 
AGAGCATGCT 
TTCTTTGACA 
TTTTAATAAA 
ATTCTTAAAA 



11 
I 

CCCTCCGGGC 

AAACGCGAGC 

TGCGGCTGGC 

CCTCGGCATC 

CCCCGCTGCC 

AGTGCGTTAA 

TCTTCCTTAC 

CGCTGGCGGA 

GCGCCTTCGA 

ACCTCAGTCC 

TGGAACTGAT 

AGGGCATGGT 

AGCTGGCCAG 

TCAGGCACCT 

AC CTGAC ACA 

GCACCCTGGC 

GGGTCTGCGA 

AGGGCAAAGA 

AACTCAACAG 

ATGTCTTCCT 

TGAACCGCAA 

TGGAAGGGTA 

CTAACTCGGA- 

AGACTTAAGC 

GGACTTTGAC 

TGTTCTGTTA 

TGGAACTCCT 

GCTGTCTGTC 

TTCAACAAAA 

ATTCTCATGT 

TAGCAGGCTC 

TACATTTTAC 

AAGTAAATTA 

CTGCATCGAG 

GAA 



21 



31 



CCAGCCTCCC 
CGCGATGCCT 
GCGACTAGCG 
CTCCTTCTCC 
GGACCAGTGC 
CCGCAATCTG 
CGGCAACCAG 
GCTGGCCGCG 
GCATCTGCCC 
CTTCGCTTTC 
CCTGAACCAC 
GGTGGCGGCC 
CAACCACTTC 
GGACTTAAGT 
TCTAGAAAGC 
TGAGT TGCAA 
CTGCCACATG 
CCGGCTCACC 
TGCTGACCTG 
GGGTATTGTT 
GGGGATAAAA 
TCATTACAGA 
TGT CTGAGAA 
TTTATCCCTA 
TAAAAGCAGT 
ATGTAAGACG 
CAACACGTAT 
TCTCTCTCAG 
GCTGCCTCAA 
ACCTAAGTTG 
TTCAAAATAA 
TGTTCTGCAT 
CTTTTTTGAT 
AT CCAACCG A 



GAGCCTTCGG 
GGGGGGTGCT 
CTGGTACTCC 
TCCTCGGCGC 
CCCGCGCTGT 
ACCGAGGTGC 
CTGGCCGTGC 
CTCAACCTCA 
AGCCTGCGCC 
TCGGGCAGCA 
ATCGTGCCCC 
CTGCTGGCGG 
CTTTACCTGC 
AATAATTCGC 
CTCCACCTGG 
GGTCTACCCC 
GCAGACATGG 
TGTGCATATC 
GACTGTGACC 
TTAGCCCTGA 
AAGTGGATGC 
TATGAAATCA 
ATATTAGAGG 
CTAGGCTTGC 
GAAGGGGATT 
ATGAACAGTT 
GGAGGGATTT 
TACAGTTCAA 
CTTTTTCGAG 
TGGAGAAAAT 
CTCCATGGTG 
ATTACAAAAA 
TGCAGTTTAT 
CTGAATTGTT 



41 
I 

AGCGGGCGCC 
CCCGGGGCCC 
TGGGCTGGGT 
CGTTCCTGGC 
GCGAGTGCTC 
CCACGGACCT 
TCCCTGCCGG 
GCGGCAGCCG 
AGCTCGACCT 
ATGCCAGCGT 
CTGAAGATGA 
GCCGTGCACT 
CGCGGGATGT 
TGGTGAGCCT 
AGGACAATGC 
ACATTAGGGT 
TGACCTGGCT 
CGGAAAAAAT 
CGATTCTTCC 
TAGGCGCTAT 
ATAACATCAG 
ATGCGGACCC 
ACAGACCAAG 
TCCACTTTCA 
TGCTTCCTTG 
GTGTATAGTG 
TTCAGGTTTC 
GGTGTAGCAA 
AAAAATACTT 
AATTGCATCC 
CACAGGAGCA 
ATAACTTGCA 
ATGAAAATGT 
AAAAAAAAAA 



51 



GTCCCAGCCC 
CGCCGCCGGG 
CTCCTCGTCT 
TTCCGCCGTG 
CGAGGCAGCG 
GCCCGCCTAC 
CGCCTTCGCC 
CCTGGACGAG 
CAGCCACAAC 
CTCGGCCCCC 
GCGGCAGAAC 
GCAGGGGCTC 
GCTGGCCCAA 
GACCTACGTG 
CCTCAAGGTC 
TTTCCTGGAC 
CAAGGAAACA 
GAGGAATCGG 
CCCATCCCTG 
TTTCCTCCTG 
AGATGCCTGC 
CAGATTAACA 
GACAACTCTG 
TCCTCCACTA 
TTATGTAAAG 
TTTTACCCTC 
AGCATGAACA 
GTGTACCCAC 
TATT CATAAA 
TATAAACTGC 
CCTGCATCCA 
ACTTCATAAC 
ACTGATTTTT 
AAAAATAAAG 



60 
120 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
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Seq ID NO: 405 Protein sequence 
Protein Accession #: NP 006661 



MPGGCSRGPA 
QCPALCECSE 
AALNLSGSRL 
NHIVPPEDER 
LSNNSLVSLT 
HMADMVTWLK 
IVLALIGAIF 



11 
I 

AGDGRDRLAR 
AARTVKCVNR 
DEVRAGAFEH 
QNRSFEGMW 
YVSFRNLTHL 
ETEWQGKDR 
LLVLYLNRKG 



21 
I 

LALiVLLGWVS 
NLTEVPTDLiP 
LPSLRQLDLS 
AALLAGRALQ 
ESLHLEDNAIi 
LTCAYPEKMR 
IKKWMHNIRD 



31 

I 

SSSPTSSASS 
AYVRNLFLTG 
HNPLADLSPF 
GLRRLELASN 
KVLHNGTLAE 
NRVLLELNSA 
ACRDHMEGYH 



41 



FSSSAPFIiAS 
NQIjAVLPAGA 
AFSGSNASVS 
HFLYLPRDVL 
LQGLPHIRVF 
DLDCDPILPP 
YRYEINADPR 



51 

I 

AVSAQPPLPD 60 

FARRPPLAEL 120 

APSPLVELIL 180 

AQLPSLRHLD 240 

LDNNPWVCDC 300 

SLQTSYVFLG 3 60 
LTNLSSNSDV 



Seq ID NO: 406 DNA sequence 

Nucleic Acid Accession #: Eos sequence 
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J ATGGCTGGGG GGTGCTCCCG GGGCCCCGCC GCCGGGGACG GGCGTCTGCG GCTGGCGCGA 60 

CTAGCGCTGG TACTCCTGGG CTGGGTCTCC TCGTCTTCTC CCACCTCCTC GGCATCCTCC 120 

TTCTCCTCCT CGGCGCCGTT CCTGGCTTCC GCCGTGTCCG CCCAGCCCCC GCTGCCGGAC 180 

CAGTGCCCCG CGCTGTGCGA GTGCTCCGAG GCAGCGCGCA C AGT CAAGTG CGTTAACCGC 240 

AATCTGACCG AGGTGCCCAC GGACCTGCCC GCCTACGTGC GCAACCTCTT CCTTACCGGC 300 

10 AACCAGCTGG CCAGCAACCA CTTCCTTTAC CTGCCGCGGG ATGTGCTGGC CCAACTGCCC 3 60 

AGCCTCAGGC ACCTGGACTT AAGTAATAAT TCGCTGGTGA GCCTGACCTA CGTGTCCTTC 420 

CGCAACCTGA CACATCTAGA AAGCCTCCAC CTGGAGGACA ATGCCCTCAA GGTCCTTCAC 480 

AATGGCACCC TGGCTGAGTT GCAAGGT CTA CCCCACATTA GGGTTTTCCT GGACAACAAT 540 

CCCTGGGTCT GCGACTGCCA CATGGCAGAC ATGGTGACCT GGCTCAAGGA AACAGAGGTA 600 

15 GTGCAGGGCA AAGACCGGCT CACCTGTGCA T AT CCGGAAA AAATGAGGAA TCGGGTCCTC 660 

TTGGAACTCA ACAGTGCTGA CCTGGACTGT GACCCGATTC TTCCCCCATC CCTGCAAACC 72 0 

TCTTATGTCT T CCTGGGT AT TGTTTTAGCC CTGATAGGCG CTATTTTCCT CCTGGTTTTG 780 

TATTTGAACC GCAAGGGGAT AAAAAAGTGG ATGCATAACA TCAGAGATGC CTGCAGGGAT 840 

CACATGGAAG GGTATCATTA CAGATATGAA ATCAATGCGG ACCCCAGATT AACAAACCTC 90 0 

20 AGTTCTAACT CGGATGTCCT CGAGTGA 

Seq ID NO: 407 Protein sequence 
Protein Accession #: Eos sequence 

25 1 11 21 31 41 51 

I I i I I I 

MPGGCSRGPA AGDGRLRLAR LALVLLGWVS SSSPTSSASS FSSSAPFLAS AVSAQPPLPD 60 

QCPALCECSE AARTVKCVNR NIjTEVPTDLP AYVRNLFLTG NQLASNHFLY LPRDVLAQLP 120 

SLRHLDLSNN SLVSLTYVSF RNLTHLESLH LEDNALKVLH NGTLAELQGL PHIRVFLDNN 180 

30 PWVCDCHMAD MVTWLKETEV VQGKDRLTCA YPEKMRNRVL LELNSADLDC DPILPPSLQT 240 

SYVFLGIVLA LIGAIFLLVL YLNRKGIKKW MHNIRDACRD HMEGYHYRYE INADPRLTNL 300 
SSNSDVLE 

Seq ID NO: 408 DNA sequence 
35 Nucleic Acid Accession #: NM_000095 . 1 
Coding sequence: 26.-22 99 

1 11 21 31 41 51 

An 1 1 1 1 1 1 

4U CAGCACCCAG CTCCCCGCCA CCGCCATGGT CCCCGACACC GCCTGCGTTC TTCTGCTCAC 60 

CCTGGCTGCC CTCGGCGCGT CCGGACAGGG CCAGAGCCCG TTGGGCTCAG ACCTGGGCCC 120 

GCAGATGCTT CGGGAACTGC AGGAAACCAA CGCGGCGCTG CAGGACGTGC GGGACTGGCT 180 

GCGGCAGCAG GTCAGGGAGA TCACGTTCCT GAAAAACACG GTGATGGAGT GTGACGCGTG 240 

CGGGATGCAG CAGT CAGT AC GCACCGGCCT ACCCAG CGTG CGGCCCCTGC TCCACTGCGC 300 

45 GCCCGGCTTC TGCTTCCCCG GCGTGGCCTG CATCCAGACG GAGAGCGGCG GCCGCTGCGG 3 60 

CCCCTGCCCC GCGGGCTTCA CGGGCAACGG CTCGCACTGC ACCGACGTCA ACGAGTGCAA 420 

CGCCCACCCC TGCTTCCCCC GAGTCCGCTG TATCAACACC AGCCCGGGGT TCCGCTGCGA 48 0 

GGCTTGCCCG CCGGGGTACA GCGGCCCCAC CCACCAGGGC GTGGGGCTGG CTTTCGCCAA 540 

GGCCAACAAG CAGGTTTGCA CGGACATCAA CGAGTGTGAG ACCGGGCAAC ATAACTGCGT 60 0 

50 CCCCAACTCC GTGTG CATCA ACACCCGGGG CTCCTTCCAG TGCGGCCCGT GCCAGCCCGG 660 

CTTCGTGGGC GACCAGGCGT CCGGCTGCCA GCGCGGCGCA CAGCGCTTCT GCCCCGACGG 720 

CTCGCCCAGC GAGTGCCACG AGCATGCAGA CTGCGTCCTA GAGCGCGATG GCTCGCGGTC 780 

GTGCGTGTGT CGCGTTGGCT GGGCCGGCAA CGGGATCCTC TGTGGTCGCG ACACTGACCT 840 

AGACGGCTTC CCGGACGAGA AGCTGCGCTG CCCGGAGCCG CAGTGCCGTA AGGACAACTG 900 

55 CGTGACTGTG CCCAACTCAG GGCAGGAGGA TGTGGACCGC GATGGCATCG GAGACGCCTG 960 

CGATCCGGAT GCCGACGGGG ACGGGGTCCC CAATGAAAAG GACAACTGCC CGCTGGTGCG 102 0 

GAACCCAGAC CAGCGCAACA CGGACGAGGA CAAGTGGGGC GATGCGTGCG ACAACTGCCG 1080 

GTCCCAGAAG AACGACGACC AAAAGGACAC AGACCAGGAC GGCCGGGGCG ATGCGTGCGA 1140 

CGACGACATC GACGGCGACC GGAT CCGCAA CCAGGCCGAC AACTGCCCTA GGGTACCCAA 1200 

60 CTCAGACCAG AAGGACAGTG ATGGCGATGG TATAGGGGAT GCCTGTGACA ACTGTCCCCA 1260 

GAAGAGCAAC CCGGATCAGG CGGATGTGGA CCACGACTTT GTGGGAGATG CTTGTGACAG 1320 

CGATCAAGAC CAGGATGGAG ACGGACATCA GGACTCTCGG GACAACTGTC CCACGGTGCC 1380 

TAACAGTGCC CAGGAGGACT CAGACCACGA TGGCCAGGGT GATGCCTGCG ACGACGACGA 1440 

CGACAATGAC GGAGT CCCTG ACAGTCGGGA CAACTGCCGC CTGGTGCCTA ACCCCGGCCA 1500 

65 GGAGGACGCG GACAGGGACG GCGTGGGCGA CGTGTGCCAG GACGACTTTG ATGCAGACAA 1560 

GGTGGTAGAC AAGATCGACG TGTGTCCGGA GAACGCTGAA GT CACGCTCA CCGACTTCAG 162 0 

GGCCTTCCAG ACAGTCGTGC TGGACCCGGA GGGTGACGCG CAGATTGACC CCAACTGGGT 1680 

GGTGCTCAAC CAGGGAAGGG AGATCGTGCA GACAATGAAC AGCGACCCAG GCCTGGCTGT 1740 

GGGTTACACT GCCTTCAATG GCGTGGACTT CGAGGGCACG TTCCATGTGA ACACGGTCAC 1800 

70 GGATGACGAC TATGCGGGCT TCATCTTTGG CTACCAGGAC AGCTCCAGCT TCTACGTGGT 1860 

CATGTGGAAG C AG ATGG AG C AAACGTATTG GCAGGCGAAC CCCTTCCGTG CTGTGGCCGA 192 0 

GCCTGGCATC CAACTCAAGG CTGTGAAGTC TTCCACAGGC CCCGGGGAAC AGCTGCGGAA 1980 

CGCTCTGTGG CATACAGGAG ACACAGAGTC CCAGGTGCGG CTGCTGTGGA AGGACCCGCG 2040 

AAACGTGGGT TGGAAGGACA AGAAGTCCTA TCGTTGGTTC CTGCAGCACC GGCCCCAAGT 2100 

75 GGGCTACATC AGGGTGCGAT TCTATGAGGG CCCTGAGCTG GTGGCCGACA GCAACGTGGT 2160 

CTTGGACACA ACCATGCGGG GTGGCCGCCT GGGGGTCTTC TGCTTCTCCC AGGAGAACAT 2220 

CATCTGGGCC AACCTGCGTT ACCGCTGCAA TGACACCATC CCAGAGGACT ATGAGACCCA 22 8 0 

TCAGCTGCGG CAAGCCTAGG GACCAGGGTG AGGACCCGCC GGATGACAGC CACCCTCACC 2340 

GCGGCTGGAT GGGGGCTCTG CACCCAGCCC AAGGGGTGGC CGTCCTGAGG GGGAAGTGAG 240 0 

80 AAGGGCTCAG AGAGGACAAA ATAAAGTGTG TGTGCAGGG 

Seq ID NO: 40 9 Protein sequence 
Protein Accession #: NP_000086.1 

85 1 11 21 31 41 51 

I I i I I I 

MVPDTACVLL LTLAALGASG QGQSPLGSDL GPQMLRELQE TNAALQDVRD WLRQQVREIT 60 



336 



WO 02/086443 

FLKNTVMECD ACGMQQSVRT GLPSVRPLbH 
NGSHCTDVNE CNAHPCFPRV RCINTSPGFR 
INECETGQHN CVPNSVCINT RGSFQCGPCQ 
ADCVLERDGS RSCVCRVGWA GNGILCGRDT 
EDVDRDGIGD ACDPDADGDG VPNEKDNCPL 
DTDQDGRGDA CDDDIDGDRI RNQADNCPRV 
VDHDFVGDAC DSDQDQDGDG HQDSRDNCPT 
RDNCRLVPNP GQEDADRDGV GDVCQDDFDA 
PEGDAQIDPN WWLNQGREI VQTMNSDPGL 
FGYQDSSSFY WMWKQMEQT YWQANPFRAV 
ESQVRLLWKD PRNVGWKDKK SYRWFLQHRP 
RLGVFCFSQE NIIWANLRYR CNDT I PEDYE 



CAPGFCFPGV ACIQTESGGR CGPCPAGFTG 
CEACPPGYSG PTHQGVGLAF AKANKQVCTD 
PGFVGDQASG CQRGAQRFCP DGSPSECHEH 
DLDGFPDEKIj RCPEPQCRKD NCVTVPNSGQ 
VRNPDQRNTD EDKWGDACDN CRSQKNDDQK 
PNSDQKDSDG DGIGDACDNC PQKSNPDQAD 
VPNSAQEDSD HDGQGDACDD DDDNDGVPDS 
DKWDKIDVC PENAEVTLTD FRAFQTWLD 
AVGYTAFNGV DFEGTFHVNT VTDDDYAGF I 
AEPGIQLKAV KSSTGPGEQL RNALWHTGDT 
QVGYIRVRFY EGPELVADSN WLDTTMRGG 
THQLRQA 



Seq ID NO: 410 DNA sequence 

Nucleic Acid Accession #: NM_00 1565.1 

Coding sequence: 6 7.. 3 63 



1 11 21 31 41 51 

I l I I l I 

GAGACATTCC TCAATTGCTT AGACATATTC TGAGCCTACA GCAGAGGAAC CTCCAGTCTC 
AGCACCATGA ATCAAACTGC GATTCTGATT TGCTGCCTTA TCTTTCTGAC TCTAAGTGGC 
ATTCAAGGAG TACCTCTCTC TAGAACCGTA CGCTGTACCT GCATCAGCAT TAGTAATCAA 
CCTGTTAATC CAAGGTCTTT AGAAAAACTT GAAATTATTC CTGCAAGCCA ATTTTGTCCA 
CGTGTTGAGA TCATTGCTAC AATGAAAAAG AAGGGTGAGA AGAGATGTCT GAATCCAGAA 
TCGAAGGCCA TCAAGAATTT ACTGAAAGCA GTTAGCAAGG AAATGTCTAA AAGATCTCCT 
TAAAACCAGA GGGGAGCAAA ATCGATGCAG TGCTTCCAAG GATGGACCAC ACAGAGGCTG 
CCTCTCCCAT CACTTCCCTA CATGGAGTAT ATGT CAAGCC ATAATTGTTC TTAGTTTGCA 
GTTACACTAA AAGGTGACCA ATGATGGTCA CCAAATCAGC TGCTACTACT CCTGTAGGAA 
GGTTAATGTT CATCATCCTA AGCTATTCAG TAATAACTCT ACCCTGGCAC TATAATGTAA 
GCTCTACTGA GGTG CTATGT TCTTAGTGGA TGTTCTGACC CTGCTTCAAA TATTTCCCTC 
ACCTTTCCCA TCTTCCAAGG GTACTAAGGA ATCTTTCTGC TTTGGGGTTT ATCAGAATTC 
TCAGAATCTC AAATAACTAA AAGGTATGCA ATCAAATCTG CTTTTTAAAG AATGCTCTTT 
ACTTCATGGA CTTCCACTGC CATCCTCCCA AGGGGCCCAA ATTCTTTCAG TGGCTACCTA 
CATACAATTC CAAACACATA CAGGAAGGTA GAAATATCTG AAAATGTATG TGTAAGTATT 
CTTATTTAAT GAAAGACTGT ACAAAGTATA AGT CTTAGAT GTATATATTT CCTATATTGT 
TTTCAGTGTA CATGGAATAA CATGTAATTA AGTACTATGT ATCAATGAGT AACAGGAAAA 
TTTTAAAAAT ACAGATAGAT ATATGCTCTG CATGTTACAT AAGATAAATG TGCTGAATGG 
TTTTCAAATA AAAATGAGGT ACTCT CCTGG AAATATTAAG 



Seq ID NO: 411 Protein sequence 
Protein Accession #: NP 001556.1 



1 11 21 31 41 51 

1 1 1 I I I 

MNQTAILICC LIFLTLSGIQ GVPLSRTVRC TCISISNQPV NPRSLEKLEI IPASQFCPRV 

EIIATMKKKG EKRCLNPESK AIKNLLKAVS KEMSKRSP 



Seq ID NO: 412 DNA sequence 

Nucleic Acid Accession #: XM_057014 

Coding sequence: 143.. 874 



1 11 

I I 
GGGAGGGAGA GAGGCGCGCG 

CGCGGCGGAG CCAGACGCTG 

CGCTGCCCGG CAGCCGGGAG 

CCGCGGCCTC CTGCTGCTCC 

CCCCAAGGGG AAGCAAAAGG 

AATGTGCTTA CAAGGGCCAG 

CATTCCGGGT ACACCTGGGA 

TCTGAGGGAA AGCTTTGAGG 

ATTGAATTAT GGCATAGATC 

AAATAGTGCT CTAAGAGTTT 

CTGTCAGCGT TGGTATTTCA 

AG CT ATAATT TATTTGGACC 

CACTTCTTCT GTGGAAGGAC 

CTGGGTTGGC ACTTGTTCAG 

TTCTCGCATC ATTATTGAAG 

TTTTTTTATT ATGCCTTGGA 

CATCTGAATG AAAAGCAAAG 

TTTAAATCTA GCATTATTCA 

TGGTTAGAAT ACTTTCTTCA 

GGTCTTTTGT TTTTTCTCTT 

TGTACAATTT GTAAATGT T A 

CAACCTTAAA AAAAAAAAAA 



21 31 

I I 
GGTGAAAGGC GCATTGATGC 

ACCACGTTCC TCTCCTCGGT 

CCATGCGACC CCAGGGCCCC 

TGCTGCTGCA GCTGCCCGCG 

CGCAGCTCCG GCAGAGGGAG 

CAGGAGTGCC TGGTCGAGAC 

TCCCAGGTCG GGATGGATTC 

AGTCCTGGAC ACCCAACTAC 

TTGGGAAAAT TGCGGAGTGT 

TGTTCAGTGG CTCACTTCGG 

CATTCAATGG AG CTG AATGT 

AAGGAAGCCC TGAAATGAAT 

TTTGTGAAGG AATTGGTGCT 

ATTACCCAAA AGGAGATGCT 

AACTACCAAA ATAAATGCTT 

ATGGTTCACT TAAATGACAT 

CTAAATATGT TTACAGACCA 

TTTTGCTTCA ATCAAAAGTG 

TAGT CACATT CTCTCAACCT 

AGTATAGCAT TTTTAAAAAA 

AGAATTTTTT TTATATCTGT 

AAAA 



41 51 

I 1 
AGCCTGCGGC GGCCTCGGAG 

CTCCTCCGCC TCCAGCTCCG 

GCCGCCTCCC CGCAGCGGCT 

CCGTCGAGCG CCTCTGAGAT 

GTGGTGGACC TGTATAATGG 

GGGAGCCCTG GGGCCAATGG 

AAAGGAGAAA AGGGGGAATG 

AAGCAGTGTT CATGGAGTTC 

ACATTTACAA AGATGCGTTC 

CTAAAATGCA GAAATGCATG 

TCAGGACCTC TTCCCATTGA 

TCAACAATTA ATATTCATCG 

GGATTAGTGG ATGTTGCTAT 

TCTACTGGAT GGAATTCAGT 

TAATTTTCAT TTGCTACCTC 

TTTAAATAAG TTTATGTATA 

AAGTGTGATT TCACACTGTT 

GTTTCAATAT TTTTTTTAGT 

ATAATTTGGA ATATTGTTGT 

ATATAAAAGC TACCAATCTT 

TAAATAAAAA TTATTTCCAA 



Seq ID NO: 413 Protein sequence 
Protein Accession #: XP 057014 



1 11 21 31 41 51 

i 1 1 1 I I 

MRPQGPAASP QRLRGLLLLL LLQLPAPSSA SEIPKGKQKA QLRQREWDL YNGMCLQGPA 

GVPGRDGSPG ANGIPGTPGI PGRDGFKGEK GECLRESFEE SWTPNYKQCS WSSLNYGIDD 

GKIAECTFTK MRSNSALRVL FSGSLRLKCR NACCQRWYFT FNGAECSGPL PIEAIIYLDQ 

GSPEMNSTIN IHRTSSVEGL CEGIGAGLVD VAIWVGTCSD YPKGDASTGW NSVSRIIIEE 

LPK 
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Seq ID NO: 414 DNA sequence 

Nucleic Acid Accession #: XM_084007 

Coding sequence: 138.. 2405 



PCT/US02/12476 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



i 

1 

CTCGTGCCGA 
CCAGTGGGCC 
GCGGAGACGA 
TCTCTGTCAC 
AAATTAGTCC 
ATCATCTACA 
TCAGAAAATT 
ACCACGACCA 
AGCATCACTC 
CTGCTTCTGG 
GTAAAGATCC 
GAAGGAATGT 
TCTCTGAAGG 
CCAAAGATGT 
TGGCTGGTAG 
GAAACACAAA 
GCATGGGCAT 
TCAACCAAAT 
CTCCAAAGAC 
TCAGTTTCCT 
AATTTCTCCT 
TACACCTTCT 
CAATGGAAAT 
GTGCCTATTT 
TTCTTGTTGA 
AGAAGAAACC 
CTCAACTTTC 
GAGGAGACTC 
AAGAGGTCAT 
GGTGCAAGAA 
TTCACCACCA 
CTCACAGTCA 
TGGCCTGGAT 
GTGCTGCTTT 
ATGAGTTGCC 
AGCAGGCTGT 
GAATTTT CAT 
GCTTATTCAT 
GTGACCATGG 
GTTTTGGAAT 
TCTAGTTAAG 
AGGGAGATGA 
TTGTATTGAA 
TATTCTATCT 
TAAACAAGAG 
TTTTCAAGAA 
TGTTTAGGAA 
AGCAAAGAAA 
AAAAATCACA 
CAGAATTAGT 
GTAGTGAGCA 
AAATATATTT 
TTCGTGCGGG 
TATTGCCAAG 
CAAAATTATC 
TCATTTGATT 
GAG CAATTGT 
GATGTTTCTT 



11 

i 

ATTCGGCACG 
CGTGTGGAAC 
AGGCGCAATG 
AAATCCCCTT 
GAATTGGGAA 
ACAGCTTTTC 
ACTTCAAAAT 
T CACTCAG AC 
AGACCACGAG 
TAAAAATAAG 
T AG AAACAG C 
CAAGGACAGT 
AACTCACTTT 
AAGCAGCTCC 
GAAAACAAAT 
TGAAAATCCT 
CCAGGTTCCG 
TGATGCTAGA 
CTATTCATTA 
GTCTCTGCTG 
GAGTTTCCTT 
TCCACATTCT 
GAAAAGAGGA 
TGATTCCACG 
ACATGTCCTC 
TGAAAATGAT 
AACAAATGAG 
ACAAGAGCCC 
GATAGCTCAT 
T AAATG CC AT 
TCATGACTAC 
CAGCCAGCGC 
GGTGATAATG 
TACTGAAGGC 
TCATGAATTA 
CCTTTATAAT 
TGGT CATTAT 
GTATGTTGCT 
ATGTAGCCGC 
TATGTTACTT 
GTTT AAATG C 
GTTTGTATGC 
TATTGCTGTC 
TGGAGATAAA 
ATTTGGCATG 
CTAACACAGT 
TAAGAATGTG 
TAAAGGAGAA 
AAATTTGTTG 
ATAGAGTACA 
CTCTCATATA 
AATGAATTCA 
TTATATACCA 
TT AT AT AT CA 
AGAGTAGTAA 
CGATTCAGAA 
CTTTATATAC 
TTTTACACAA 



21 
I 

AGACCGCGTG 
CAAACCTGCG 
GCGAGGAAGT 
CATGAACTAA 
T C TGG CAT T A 
TACCGCTATG 
ATAGGCATAG 
CACGAGCATC 
CATCACTCTG 
CGAAAAGCTC 
CAGGGGAAAG 
GTTAGTGCTA 
CTAGAGACAA 
ACTCCACCCA 
GAATCTGTGA 
CAGGAGTGTT 
CTGAATGCAA 
TCTTGTCTGA 
CAAATAGCCT 
GGGGTTATCT 
GTGGCACTGG 
CATGCAAGTC 
CCACTTTTCA 
TGGAAGGGTC 
ACATTGATCA 
GATGATGTGG 
GAGAAAGTAG 
TCCCACTTTG 
GCTCATCCAC 
TCACATTTCC 
CATCATATTC 
TACT C T CGGG 
GGTGATGGCC 
TTATCAAGTG 
GGTGACTTTG 
GCATTGTCAG 
GCTGAAAATG 
CTGGTTGATA 
TGGGGGTATT 
ATTTCCATAT 
TAGAGTAGCT 
TGTACTATGC 
TGTTACAAAG 
ATCTGTATGT 
ACATGTTCTG 
TATTCCTATA 
CATGAAGCCT 
AAGAGAAGAA 
TAAATTAGAG 
TTCATTAAAC 
CTAATTAGTG 
AGCAATATAC 
GATGAGTACA 
CCAAAAGCTG 
AACTTTGATA 
AGTACTTTGA 
GGTACTGTAG 
TAAATTCCTT 



31 
I 

TTCGCGCCTG 
CGCGTGGCCG 
TATCTGTAAT 
AAGCAGCTGC 
ATGTTGACTT 
GAGAAAATAA 
ATAAGATTAA 
ACTCAGACCA 
ACCATGATCA 
TTTGCCCAGA 
GAGCTCACCG 
GTGAAGTGAC 
TAGAGACTCC 
GTGTCACATC 
GTGAGCCCCG 
TCAATGCATC 
CAGAGTTCAA 
TTCATACAAG 
GGGTTGGTGG 
TAGTGCCTCT 
CCGTTGGGAC 
ACCACCATAG 
GTCATCTGTC 
TAACAGCTCT 
AACAATTTAA 
AGATTAAGAA 
ATACAGATGA 
ATTCTCAGCA 
AGGAAGTCTA 
ACGATACACT 
TCCAT CATCA 
AGGAGCTGAA 
TGCACAATTT 
GTTTAAGTAC 
CTGTTCTACT 
CCATGCTGGC 
TTTCTATGTG 
TGGTACCTGA 
TCTTTTTACA 
TTGAACATAA 
TAAAAAGTTG 
AGCGTTTAAA 
TCAGTTAAAG 
GCAATTCACC 
TATGTTTCAG 
CTGGATTTTA 
AAAATACCAA 
TCTGAGAATT 
GGGAGAAATT 
ATTTTTGTCA 
TACATTTAAC 
ACTTGACCAA 
GTGAGTAGTT 
TATGACTGGA 
TATATGAGGA 
TATCT CTCAG 
CCATACTAGG 
AT AT C AGCTT 



41 

1 

GTAGAGATTT 
GGCCGTGGGA 
CTTGATCCTG 
TTTCCCCCAG 
GGCAATTTCC 
TTCTTTGTCA 
AAGAATCCAT 
TGAGCGTCAC 
TCACTCCCAC 
CC ATG ACT CA 
ACCAGAACAT 
CTCAACTGTG 
AAGACCTGGA 
AAAGAGCCGG 
AAAAGGCTTT 
AAAGCTACTG 
CTATCTCTGT 
TGAAAAGAAG 
TTTTATAGCC 
CATGAATCGG 
TTTGAGTGGT 
TCATAGCCAT 
TTCTCAAAAC 
AGGAGGCCTG 
AGATAAGAAG 
GCAGTTGTCC 
TCGAACTGAA 
GCCTGCAGTC 
CAATGAATAT 
CGGCCAGTCA 
CCACCACCAA 
AGATGCCGGC 
CAGCGATGGC 
TTCTGTTGCT 
AAAGGCTGGC 
GTATCTTGGA 
GATATTTGCA 
AATGCTGCAC 
GAATGCTGGG 
AATCGTGTTT 
TCATAGTTTC 
GTTAGTGGGT 
GTACGTTTTA 
GGTATTACCA 
GGAAAAATGT 
GGTCTCTGAA 
GAAAGCTTAT 
GGGGAGGCAT 
TAGAATTAAG 
GGATTATTTC 
TTTGTATAAT 
GAAATTGGAA 
TATGTATCAC 
TGTTCTGGTT 
TATTAAAACT 
TGCTTCAGTG 
CCTGTCTGTG 
G 



51 
I 

CTCGAAGACA 60 

CAACGAGGCC 120 

ACCTTTGCCC 180 

ACCACTGAGA 240 

ACACGGCAAT 300 

GTTGAAGGGT 360 

ATACACCATG 420 

TCAGACCATG 480 

CATAAT CATG 540 

GATAGTTCAG 600 

GCCAGTGGTA 660 

TACAACACTG 720 

AAACTCTTCC 780 

GTGAGCCGGC 840 

ATGTATTCCA 900 

ACATCT CATG 960 

CCAGCCATCA 1020 

GCTGAAATCC 1080 

ATTTCCATCA 1140 

GTGTTTTTCA 1200 

GATGCTTTTT 1260 

GAAGAACCAG 1320 

ATAGAAGAAA 1380 

TATTTCATGT 1440 

AAAAAGAATC 1500 

AAGTATGAAT 1560 

GGCTATTTAC 1620 

TTGGAAGAAG 1680 

GTACCCAGAG 1740 

GACGATCT CA 1800 

AACCACCATC 1860 

GTCGCCACTT 1920 

CTAGCAATTG 1980 

GTGTTCTGTC 2040 

ATGACCGTTA 2100 

ATGGCAACAG 2160 

CTTACTGCTG 222 0 

AATGATGCTA 2280 

ATGCTTTTGG 23 40 

CGTATAAATT 2400 

AGTAGGTCAT 2460 

TTTGTGATTT 2 520 

ATATTTAAGT 2580 

GTTTATTATG 2640 

CTTTAATGCT 270 0 

GAACTGCTGG 2760 

ACTGAATTTA 2820 

AGATTCTTAT 2 880 

TATAAAAAGG 2 940 

CCGTAAAAAC 30 00 

ACAGAAATCT 3 0 60 

TTTCAAAATG 3120 

CAGACTGGGT 3180 

ACCTGGTTTA 3240 

ACACTAAGTA 33 00 

CTATCATTGT 3360 

GCATTCTCTA 3420 



Seq ID NO: 415 Protein sequence 
Protein Accession #: XP 084007 



70 



75 



80 



85 



MARKLSVILI 
FYRYGENNSL 
EHHSDHDHHS 
SVSASEVTST 
NESVSEPRKG 
RSCLIHTSEK 
LVALAVGTLS 
TWKGLTALGG 
EEKVDTDDRT 
HSHFHDTLGQ 
MGDGLHNFSD 
NALSAMLAYL 
RWGYFFLQNA 



11 
I 

LTFALSVTNP 
SVEGFRKLLQ 
HHNHAASGKN 
VYNTVSEGTH 
FMYSRNTNEN 
KAEIPPKTYS 
GDAFLHIiLPH 
LYFMFLVEHV 
EGYLRADSQE 
SDDL I HHHHD 
GLAIGAAFTE 
GMATGIFIGH 
GMLLGFGIML 



21 



LHELKAAAFP 
NIGIDKIKRI 
KRKALCPDHD 
FLETIETPRP 
PQECFNASKL 
LQIAWVGGFI 
SHASHHHSHS 
LTLIKQFKDK 
PSHFDSQQPA 
YHHILHHHHH 
GLSSGLSTSV 
YAENVSMWIF 
LISIFEHKIV 



31 
I 

QTTEKISPNW 
HIHHDHDHHS 
SDSSGKDPRN 
GKLFPKDVSS 
LTSHGMGIQV 
AISIISFLSL 
HEEPAMEMKR 
KKKNQKKPEN 
VLEEEEVMIA 
QNHHPHSHSQ 
AVFCHELPHE 
ALTAGLFMYV 
FRINF 



41 
I 

ESGINVDLAI 
DHEHHSDHER 
SQGKGAHRPE 
STPPSVTSKS 
PLNATEFNYL 
LGVILVPLMN 
GPLFSHLSSQ 
DDDVEIKKQL 
HAHPQEVYNE 
RYSREELKDA 
LGDFAVLLKA 
ALVDMVPEML 



51 
I 

STRQYHLQQL 60 

H SDHEHH SDH 12 0 

HASGRRNVKD 180 

RVSRLAGRKT 240 

CPAIINQIDA 300 

RVFFKFLLSF 360 

NIEESAYFDS 420 

SKYESQLSTN 480 

YVPRGCKNKC 540 

GVATLAWMVI 600 

GMTVKQAVLY 660 

HNDASDHGCS 720 



Seq ID NO: 416 DNA sequence 

Nucleic Acid Accession #: NM_015419.1 

Coding sequence: 1..8487 



338 



WO 02/086443 



1 11 21 31 41 51 

I I I I I I 

ATGCCCAAGC GCGCGCACTG GGGGGCCCTC TCCGTGGTGC TGATCCTGCT TTGGGGCCAT 60 

CCGCGAGTGG CGCTGGCCTG CCCGCATCCT TGTGCCTGCT ACGTCCCCAG CGAGGTCCAC 120 

TGCACGTTCC GATCCCTGGC TTCCGTGCCC GCTGGCATTG CTAGACACGT GGAAAGAATC 180 

AATTTGGGGT TTAATAGCAT ACAGGCCCTG TCAGAAACCT CATTTGCAGG ACTGACCAAG 240 

TTGGAGCTAC TTATGATTCA CGGCAATGAG ATCCCAAGCA TCCCCGATGG AGCTTTAAGA 300 

GACCTCAGCT CTCTTCAGGT TTTCAAGTTC AGCTACAACA AGCTGAGAGT GATCACAGGA 3 60 

CAGACCCTCC AGGGTCTCTC TAACTTAATG AGGCTGCACA TTGACCACAA CAAGAT CG AG 420 

TTTATCCACC CTCAAGCTTT CAACGGCT T A ACGTCTCTGA GGCTACTCCA TTTGGAAGGA 480 

AATCTCCTCC ACCAGCTGCA CCCCAGCACC TTCTCCACGT TCACATTTTT GGATTATTTC 540 

AGACT CT CCA CCATAAGGCA CCTCTACTTA GCAGAGAACA TGGTTAGAAC TCTTCCTGCC 600 

AGCATGCTTC GGAACATGCC GCTTCTGGAG AATCTTTACT TGCAGGGAAA TCCGTGGACC 660 

TGCGATTGTG AGATGAGATG GTTTTTGGAA TGGGATGCAA AATCCAGAGG AATTCTGAAG 720 

TGTAAAAAGG ACAAAGCTTA TGAAGGCGGT CAGTTGTGTG CAATGTGCTT CAGTCCAAAG 780 

AAGTTGTACA AACATGAGAT ACACAAGCTG AAGGACATGA CTTGTCTGAA GCCTTCAATA 840 

GAGTCCCCTC TGAGACAGAA CAGGAGCAGG AGTATTGAGG AGGAGCAAGA ACAGGAAGAG 900 

GATGGTGGCA GCCAGCTCAT CCTGGAGAAA TTCCAACTGC CCCAGTGGAG CATCTCTTTG 960 

AATATGACCG ACGAGCACGG GAACATGGTG AACTTGGTCT GTGACATCAA GAAACCAATG 102 0 

GATGTGTACA AGATTCACTT GAACCAAACG GATCCTCCAG ATATTGACAT AAATGCAACA 10 80 

GTTGCCTTGG ACTTTGAGTG T CCAATGACC CGAGAAAACT ATGAAAAGCT ATGGAAATTG 1140 

ATAGCATACT ACAGTGAAGT T CCCGTG AAG CTACACAGAG AGCTCATGCT CAGCAAAGAC 12 0 0 

CCCAGAGTCA GCTACCAGTA CAGGCAGGAT GCTGATGAGG AAGCTCTTTA CTACACAGGT 12 60 

GTGAGAGCCC AGATTCTTGC AGAACCAGAA TGGGTCATGC AGCCATCCAT AGATATCCAG 132 0 

CTGAACCGAC GTCAGAGTAC GGCCAAGAAG GTGCTACTTT CCTACTACAC CCAGTATTCT 13 80 

CAAACAATAT CCACCAAAGA TACAAGGCAG GCTCGGGGCA GAAGCTGGGT AATGATTGAG 1440 

CCTAGTGGAG CTGTGCAAAG AGATCAGACT GTCCTGGAAG GGGGTCCATG CCAGTTGAGC 150 0 

TGCAACGTGA AAGCTTCTGA GAGTCCATCT ATCTTCTGGG TGCTTCCAGA TGGCTCCATC 15 60 

CTGAAAGCGC CCATGGATGA CCCAGACAGC AAGTTCTCCA TTCTCAGCAG TGGCTGGCTG 162 0 

AGGATCAAGT CCATGGAGCC ATCTGACTCA GGCTTGTACC AGTGCATTGC TCAAGTGAGG 1680 

GATGAAATGG ACCGCATGGT ATATAGGGTA CTTGTGCAGT CTCCCTCCAC TCAGCCAGCC 1740 

GAGAAAGACA CAGTGACAAT TGGCAAGAAC CCAGGGGAGT CGGTGACATT GCCTTGCAAT 18 0 0 

GCTTTAGCAA TACCCGAAGC CCACCTTAGC TGGATTCTTC CAAACAGAAG GATAATTAAT 1860 

GATTTGGCTA ACACATCACA TGTATACATG TTGCCAAATG GAACTCTTTC CATCCCAAAG 192 0 

GTCCAAGTCA GTGATAGTGG TTACTACAGA TGTGTGGCTG TCAACCAGCA AGGGGCAGAC 198 0 

CATTTTACGG TGGGAATCAC AGTGACCAAG AAAGGGTCTG GCTTGCCATC CAAAAGAGGC 2040 

AGACGCCCAG GTGCAAAGGC TCTTTCCAGA GTCAGAGAAG ACAT CGTGGA GGATGAAGGG 2100 

GGCTCGGGCA TGGGAGATGA AGAGAACACT TCAAGGAGAC TTCTGCATCC AAAGGACCAA 2160 

GAGGTGTTCC TCAAAACAAA GGATGATGCC ATCAATGGAG ACAAGAAAGC CAAGAAAGGG 2220 

AGAAGAAAGC TGAAACTCTG GAAGCATTCG GAAAAAGAAC CAGAGACCAA TGTTGCAGAA 22 80 

GGT CGCAGAG TGTTTGAATC TAGACGAAGG ATAAACATGG CAAACAAACA GATTAATCCG 2340 

GAGCGCTGGG CTGATATTTT AGCCAAAGTC CGTGGGAAAA ATCTCCCTAA GGGCACAGAA 240 0 

GTACCCCCGT TGATTAAAAC CACAAGTCCT CCATCCTTGA GCCTAGAAGT CACACCACCT 24 60 

TTTCCTGCTG TTTCTCCCCC CTCAGCATCT CCTGTGCAGA CAGTAACCAG TGCTGAAGAA 252 0 

TCCTCAGCAG ATGTACCTCT ACTTGGTGAA GAAGAGCACG TTTTGGGTAC CATTTCCTCA 25 8 0 

GCCAGCATGG GGCTAGAACA CAACCACAAT GGAGTTATTC TTGTTGAACC TGAAGTAACA 2640 

AGCACACCTC TGGAGGAAGT TGTTGATGAC CTTTCTGAGA AGACTGAGGA GATAACTTCC 2 700 

ACTGAAGGAG ACCTGAAGGG GACAGCAGCC CCTACACTTA TATCTGAGCC TTATGAACCA 2 760 

TCTCCTACTC TGCACACATT AGACACAGT C TATGAAAAGC CCACCCATGA AGAGACGGCA 2 820 

ACAGAGGGTT GGTCTGCAGC AGATGTTGGA TCGTCACCAG AGCCCACATC CAGTGAGTAT 2 880 

GAGCCTCCAT TGGATGCTGT CTCCTTGGCT GAGTCTGAGC CCATGCAATA CTTTGACCCA 2 940 

GATTTGGAGA CTAAGTCACA ACCAGATGAG GATAAGATGA AAGAAGACAC CTTTGCACAC 3 000 

CTTACTCCAA CCCCCACCAT CTGGGTTAAT GACTCCAGTA CATCACAGTT ATTTGAGGAT 3 060 

T CT ACTAT AG GGGAACCAGG TGTCCCAGGC CAATCACATC TACAAGGACT GACAGACAAC 312 0 

AT CCACCTTG TGAAAAGTAG TCTAAGCACT CAAGACACCT TACTGATTAA AAAGGGTATG 3180 

AAAGAGATGT CTCAGACACT ACAGGGAGGA AATATGCTAG AGGGAGACCC CACACACTCC 3240 

AGAAGTTCTG AGAGTGAGGG CCAAGAGAGC AAAT CCATCA CTTTGCCTGA CTCCACACTG 33 0 0 

GGTATAATGA GCAGTATGTC TCCAGTTAAG AAGCCTGCGG AAACCACAGT TGGTACCCTC 33 60 

CTAGACAAAG ACACCACAAC AGTAACAACA ACACCAAGGC AAAAAGTTGC TCCGTCATCC 3 42 0 

AC CAT GAG CA CTCACCCTTC TCGAAGGAGA CCCAACGGGA GAAGGAGATT ACGCCCCAAC 3 480 

AAATTCCGCC ACCGGCACAA GCAAACCCCA CCCACAACTT TTGCCCCATC AGAGACTTTT 3540 

TCTACTCAAC CAACTCAAGC ACCTGACATT AAGATTTCAA GTCAAGTGGA GAGTTCTCTG 3 60 0 

GTT CCTACAG CTTGGGTGGA TAACACAGTT AATACCCCCA AACAGTTGGA AATGGAGAAG 3 660 

AATGCAGAAC CCACATCCAA GGGAACACCA CGGAGAAAAC ACGGGAAGAG GCCAAACAAA 3 720 

CATCGATATA CCCCTTCTAC AGTGAGCTCA AGAGCGTCCG GATCCAAGCC CAGCCCTTCT 3 780 

CCAGAAAATA AACATAGAAA CATTGTTACT CCCAGTTCAG AAACTATACT TTTGCCTAGA 3 840 

ACTGTTTCTC TGAAAACTGA GGGCCCTTAT GATTCCTTAG ATTACATGAC AACCACCAGA 3 90 0 

AAAATATATT CATCTTACCC TAAAGT CCAA GAGACACTTC CAGTCACATA TAAACCCACA 3 960 

TCAGATGGAA AAGAAATTAA GGATGATGTT GCCACAAATG TTGACAAACA TAAAAGTGAC 4020 

ATTTTAGTCA CTGGTGAATC AATTACTAAT GCCATACCAA CTTCTCGCTC CTTGGTCTCC 4080 

ACTATGGGAG AATTTAAGGA AGAATCCTCT CCTGTAGGCT TTCCAGGAAC TCCAACCTGG 4140 

AATCCCTCAA GGACGGCCCA GCCTGGGAGG CTACAGACAG ACATACCTGT TACCACTTCT 42 00 

GGGGAAAAT C TTACAGACCC TCCCCTTCTT AAAGAGCTTG AGGATGTGGA TTTCACTTCC 42 60 

GAGTTTTTGT CCTCTTTGAC AGTCTCCACA CCATTTCACC AGGAAGAAGC TGGTTCTTCC 432 0 

ACAACTCTCT CAAGCATAAA AGTGGAGGTG GCTTCAAGTC AGGCAGAAAC CACCACCCTT 4380 

GAT CAAGAT C ATCTTGAAAC CACTGTGGCT ATTCTCCTTT CTGAAACTAG ACCACAGAAT 4440 

CACACCCCTA CTGCTGCCCG GATGAAGGAG CCAGCATCCT CGTCCCCATC CACAATTCTC 4500 

ATGTCTTTGG GACAAACCAC CACCACTAAG CCAGCACTTC CCAGTCCAAG AATATCTCAA 4560 

GCAT CTAGAG ATTCCAAGGA AAATGTTTTC TTGAATTATG TGGGGAATCC AGAAACAGAA 4620 

GCAACCCCAG TCAACAATGA AGGAACACAG CATATGTCAG GG C CAAATG A ATTATCAACA 4680 

CCCTCTTCCG ACCGGGATGC ATTTAACTTG TCTACAAAGC TGGAATTGGA AAAG CAAGT A 4740 

TTTGGTAGTA GGAGTCTACC ACGTGGCCCA GAT AG C CAAC GCCAGGATGG AAGAGTT CAT 4800 

GCTTCTCATC AACTAACCAG AGTCCCTGCC AAACCCATCC TACCAACAGC AACAGTGAGG 4860 

CTACCTGAAA TGTCCACACA AAGCGCTTCC AGATACTTTG TAACTTCCCA GTCACCTCGT 4 920 

CACTGGACCA ACAAACCGGA AATAACTACA TATCCTTCTG GGGCTTTGCC AGAGAACAAA 4 980 

CAGTTTACAA CTCCAAGATT ATCAAGTACA ACAATTCCTC TCCCATTGCA CATGTCCAAA 5040 
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CCCAGCATTC CTAGTAAGTT 
GTGTTTGGAA ATAACAACAT 
AGAATTCCTC AT T AT T CC AA 
CCACAGTTGG GAGTCACCCG 
GAGAGAAAAG TTATTCCAGG 
GACTTTGGCC CTCCGGCACC 
ACTAACTTAC AGAATATCCC 
TCTTCTGTCC AGTCCTCAGG 
CCTCCTGCAT CCAAATTCTG 
CAGACTGTGT CCGTCACCGC 
CCAAAGCCTT TCGTTACTTG 
AGGATACAAC GGTTTGAGGT 
CAAGATCGAG G CCAGT AT AT 
GTCTTGCTTT CGGTCACCGT 
ACTGTCTACC TGGGAGACAC 
CAAATTTCCT GGATCTTCCC 
CGCATCACCC TGCACGAAAA 
GGCGTCTATA AGTGCGTGGC 
CACGTGGCGG CACTGCCCCC 
CCGGGGCTCA GCATTCACAT 
TGGGTGCTCG GGGACGGTAC 
GTTTTCCCCA ACGGGACGCT 
GAGTGCGTGG CCGCCAACCT 
CGTGCAGCAG CCAACGCGCG 
GGAGGAACCC TCAAGCTGGA 
AGGCTGCCGT CCAAGAGGAT 
TTTGCCAATG GGACCCTGGT 
TGCGTAGCTC GAAATAAGGT 
AAACCGGCCA AGATTGAACA 
CTGAAAGTGG ACTGTGTGGC 
GACGGGAGTC TGGTGAACTC 
TATGTCGTCT TCAACAATGG 
GACTACACCT GCTTTGCTGA 
GTGGTGACAG CGCCCGCCAC 
GGAGACGTGG TCACTGTAG C 
TTGTCCCCAA CCAACAAGGT 
GGCACTCTCC TTATTCAGAA 
AGGAACAGCG CGGGAGAGGA 
AAGATCAACG GTAACCCCAA 
CGGAAACTGA TTGACTGCAA 
CCCGAGGGTG TGGTTCTGCC 
GGTTCCCTGG ACATCAGGAG 
CGCAACGAGG GAGGGGAGGC 
AAACCCATCT TCCACGACCC 
AGCCTCAACT GCTCTGCCGC 
GGCACCGATC TGCAGAGTGG 
CTACACATTA GCGGTCTCTC 
GCCGCTGGCC ACACGGAGAG 
AAGCAGTATC ATAACCTGGT 
CCTCCCGGGG CTGGGCAGGG 
GGCCCCCAAA CCCTGGGACG 
GCCT CGGTGT TTGACAGGGG 
GTCACCAGCA TCCCCGTGAT 
CCGGTCATCT ACACCCGGCC 
CCCAAAGCTG ACATCACGTG 
GCTCGTCTGT ATGGAAACAG 
ACACAGAGAG ATGCCGGCTT 
AAAACAACTT ACATCCACGT 
ACAACAAAGC GGGGTTTGTA 
GTCACAGTGC ATGGTGGCCT 
GTTGGGAAAA GGAAGCAATG 
CTTTTGTGTT TACATCATGC 
TTTCTTCTTT TGCAAATGCC 
ACATTCATCA AAAATAAGCC 
TCACCTAGTT AACCTGCTGC 
TCTTTCAGTT ATTTCCTCTG 
CAGAGTGACT GATATATATA 
TTTATATGAA AAAAGAAAAA 
TATATATTTT TTCCTTTCAA 
ATTAAAATTA ATAAATTATT 
ATATAATTTT AAAAAATTTC 
CCTTCTCCAG GAACCCTCCA 
TTTTTGTTGA AAGCTGTGCT 
AACTTTACAG AATTGAATCT 
CTGGCTTGTC CATCTGGTCT 
CCATGAATAA TACACGACCT 
ATACTGTACA TTTGATAATA 
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TACTGACCGA 
CCCTGAGGCA 
TGGAAG ACT C 
GAGACCCCAG 
TTCCTACAAC 
TCCGTTGTTG 
TATGGTCTCT 
AAGCTTCCAC 
GTCTCTTGGG 
TGAGACAGAC 
GACAAAGGTT 
TCTCAAGAAC 
GTGCACCGCC 
GCAGCAACCT 
CATTGCAATG 
TGACAGGAGG 
CCGGACCCTT 
CAGCAATGCA 
CGTTATCCAC 
TCACTGCACT 
CCAGATCCGC 
CTACATCCGC 
GGTAGGCTCC 
CAT CACGGGC 
CTGCAGCGCC 
GATCGACGCG 
GGTGAAATCA 
TGGTGATGAC 
CAAGGAGGAG 
CACCGGGCTT 
CTTCATGCAG 
GACACTCTAC 
AAATCAGGTC 
CATCCGGAAC 
CTGTGAGGCC 
GATCCCCACC 
AGCCCAGCGT 
TAGGAAGACG 
CCCCATCACC 
AGCTGAAGGC 
AGCTCCATAC 
TTTGAGGAAG 
GAGGTTGATC 
GATCAGCGAG 
GGGGACCCCG 
ACAGCAGCTG 
CTCGGTGGAC 
GCTGGTCTCC 
CAGCAT CATC 
ACGTTTCTCC 
CGTTTCTCTT 
TACCTATGTA 
TGTGATCGCC 
CGGGAACACC 
GGAGTTACCG 
ATTTCTTCAC 
CTACAAGTGC 
CTTCTGAAAT 
AGGGAAGCCA 
CTGGTGGGTT 
CAGACACGAG 
CAGGGGCTTC 
ACT CGACTGC 
ATAGACATGA 
AGTTTTTACA 
TCACTTCAAA 
TATATATTTT 
CATTTCTTCC 
ATCAGACGAT 
GGTCTTTACA 
TCTCCAACCT 
GTGGGGAAGG 
CAGAGGAGGT 
AGAGTCTTCC 
AAGGTGGCTG 
GTTATTTCCA 
AAATAATATT 



AGAACTGACC 
AGAAACCCAG 
CCTTTCTTTA 
ATACCCACTT 
AGGATACATT 
CACACTCCGC 
TCCACCCAGA 
CAGAGCAGCT 
GAAAAGCCCC 
ACTGTGTTCC 
T CCACAGGAG 
GGTACCTTAG 
AGCAACCTGC 
CAAATCCTAG 
GAGTGTCTGG 
GTGTGGCAAA 
TCCATCAAGG 
GCCGGGGCGG 
CAGGAGAAGC 
GCCAAGGCTG 
CCCTCGCAGT 
AACCTCGCGC 
GCGCGCAGGA 
ACCTCCCCGC 
TCGGGGGACC 
CTCTTCAGTT 
GTGACGGACA 
TACGTGGTGC 
AACGACCACA 
CCCAATCCCG 
TCGGATGACA 
TTTAACGAAG 
GGGAAGGACG 
AAGACTTACT 
AAAGGAGAAC 
TCCTCTGAGA 
TCTGACAGCG 
GTGTGGATTC 
ACCGTGCGGG 
ATCCCCACCC 
TATGGAAACC 
AGCGACTCCG 
GTGCAGCTCA 
AAGATCACGG 
ACACCCAGCC 
CAGCGCTTCT 
GCTGGGGCCT 
CTGAAGGTGG 
AATGGTGAGA 
TGGACGCTCC 
CTGGACAATG 
TGCAGGATGG 
TATCCTCCCC 
GTGAAACTGA 
GATAAGTCGC 
CCCCAGGGAT 
ATGGCAAAAA 
GTGGATTCCA 
GGTTGGGGAA 
TCAAGTTGAG 
AAGGAGGGCT 
ATTCAGGGTG 
CTTCATAAGC 
ACAACACCTC 
TGATAGACTT 
ACTCCAGCTT 
AATT CAGAGT 
TGGAACTCAC 
GAGACTAGAA 
AGACTTGGAT 
CCTTCAAATT 
CTGCGATATT 
GAGAGGAGAG 
CCGAAAAGCC 
CTTCTTCCCC 
TGACTGCTTT 
CTCCCAAAAA 



AATTCAATGG 

TTGGAAAGCC 

CCAACAAGAC 

CTCCTGCCCC 

CCCATAGCAC 

AGACCACGGG 

GTTCTATCTC 

CAAAGTTCTT 

AAATCCTCAC 

CCTGTGAGGC 

CTCTTATGAC 

TGATACGGAA 

ACGGCCTGGA 

CCTCCCACTA 

CCAAAGGGAC 

CTGTGTCCCC 

AGGCGTCCTT 

ACAGCCTGGC 

TGGAGAACAT 

CGCCCCTGCC 

TCCTCCACGG 

CCAAGGACAG 

CGGTGCAGCT 

GGAGGACGGA 

CCTGGCCGCG 

TTGATAGCAG 

AAGATGCCGG 

TCAAAGTGGA 

AAGT CTTCTA 

AGATCTCCTG 

GCGGTGGACG 

TGGGGATGAG 

AGATGAGAGT 

TGGCGGTTCA 

CCATGCCCAA 

AGT AT CAGAT 

GCAACTACAC 

ACGT CAACGT 

AGATAGCAGC 

CGAGGGTGTT 

GGAT CACTGT 

TCCAGCTGGT 

CTGTCCTGGA 

CCATGGCGGG 

TGGTGTGGGT 

ACCACAAGGC 

ACCGCTGCGT 

GACTGAAGCC 

CCCTGAAGCT 

CCAATGGCAT 

GCACCCTCAC 

AGACGGAGTA 

GGATCACCAG 

ACTGCATGGC 

ATCTGAAGGC 

CACTGACCAT 

ACATTCTCGG 

GAATGATTGC 

TAGGAGCTCT 

GTTGAT CTTG 

CAGCCTTGCT 

TCTGTGCTCT 

GTCCATAGGA 

ACTACCCCAT 

TGTT CCAGAT 

GCCCAATAAG 

TACATACATA 

TTTTTATATA 

GGAGAAATAC 

ACATTACAGC 

CAGTCACCAC- 

AGATTTCCTT 

GAAGGAGAAA 

CAGAAACTTC 

AGCCATGAGT 

ACTGTATTTT 

AAAAA 



TTACTCCAAA 5100 

TCCCAGTCCA 5160 

TCTTTCTTTT 5220 

AGTAATGAG A 5280 

CTTCCATCTG 5340 

ATCACCCTCA 54 00 

CTTTATAACA 5460 

TGCAGGAGGA 5520 

CAAGTCCCCA 5580 

AACAGGAAAA 5640 

TCCGAATACC 5700 

GGTT CAAGTA 5760 

CAGGATGGTG 5820 

CCAGGACGTC 5880 

CCCAGCCCCC 5940 

CGTGGAGAGC 6000 

CTCAGACAGA 6060 

CATCCGCCTG 6120 

CTCGCTGCCC 6180 

CAGCGTGCGC 6240 

GAACTTGTTT 63 00 

CGGGCGCTAT 63 60 

GAACGTGCAG 6420 

CGTCAGGTAC 6480 

CATCCTCTGG 6540 

AAT CAAGGTG 6600 

AGATTACCTG 6660 

TGTGGTGATG 6720 

CGGGGGTGAC 6780 

GAGCCTCCCA 6840 

CACCAAGCGC 6900 

GGAGGAAGGA 6960 

CAGAGTCAAG 702 0 

GGTGCCCTAT 7080 

GGTGACTTGG 7140 

ATACCAAGAT 7200 

CTGCCTGGTC 7260 

CCAGCCACCC 7320 

CGGGGGCAGT 7380 

ATGGGCTTTT 7440 

CCATGGCAAC 7500 

ATGCATGGCA 7560 

GCCCATGGAG 762 0 

CCACACCATC 7680 

CCTTCCCAAT 7740 

TGACGGCATG 780 0 

GGCCCGCAAT 7860 

AGAAGCAAAC 7920 

CCCCTGCACC 7980 

GCATCTGGAG 8040 

GGTTCGTGAG 8100 

CGGCCCTTCG 8160 

CGAGCCCACC 822 0 

TATGGGGATT 82 80 

AGGGGTTCAG 8340 

CCAGCATGCC 8400 

CAGTGACT CC 8460 

TTAGGAACTG 8520 

TAAATAATGT 8580 

ATCTACAATT 8640 

GAGACACTTT 8700 

GACTGCAATT 8760 

TATCTGAGGA 882 0 

TGAAGACGCA 8880 

TGACAAGTCA 8940 

GATTTAGAAC 9000 

CAGCTACCAT 9060 

ATGTTTTATA 9120 

TTTCTGTCTT 9180 

AGACATGGAA 924 0 

TGTTATATTA 9300 

GTATGCAAAG 93 60 

ACTGCATCAT 9420 

TCTGCAGTAT 9480 

CAGTTTGTGC 9540 

TAAGGTCAAT 9600 
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MPKRAHWGAL SWLILLWGH PRVALACPHP CACYVPSEVH CTFRSLASVP AGIARHVERI 60 

85 NLGFNSIQAL SETSFAGLTK LELLMIHGNE IPSIPDGALR DLSSLQVFKF SYNKLRVITG 12 0 

QTLQGLSNLM RLHIDHNKIE FIHPQAFNGL TSLRLLHLEG NLLHQLHPST FSTFTFLDYF 180 

RLSTIRHLYL AENMVRTLPA SMLRNMPLLE NLYLQGNPWT CD CEMRWFLE WDAKSRGILK 240 



340 



WO 02/086443 



PCT/US02/12476 



CKKDKAYEGG QLCAMCFSPK KLYKHEIHKL KDMTCLKPSI ESPLRQNRSR SIEEEQEQEE 3 00 

DGGSQLILEK FQLPQWSISL NMTDEHGNMV NLVCD I KKPM DVYKIHLNQT DPPDIDINAT 3 60 

VALDFECPMT RENYEKLWKL IAYYSEVPVK LHRELMLSKD PRVSYQYRQD ADEEALYYTG 420 

VRAQILAEPE WVMQPSIDIQ LNRRQSTAKK VLLSYYTQYS QTISTKDTRQ ARGRSWVMIE 480 

5 PSGAVQRDQT VLEGGPCQLS CNVKASESPS IFWVLPDGSI LKAPMDDPDS KFSILiSSGWL 540 

RIKSMEPSDS GLtYQCIAQVR DEMDRMVYRV LVQSPSTQPA EKDTVTIGKN PGESVTLPCN 600 

ALAIPEAHLS WILPNRRIIN DLANTSHVYM LPNGTLSIPK VQVSDSGYYR CVAVNQQGAD 660 

HFTVGITVTK KGSGLPSKRG RRPGAKALSR VREDIVEDEG GSGMGDEENT SRRLLHPKDQ 72 0 

EVFLKTKDDA I NGDKKAKKG RRKLKLWKHS EKE PETNVAE GRRVFESRRR INMANKQINP 780 

10 ERWADILAKV RGKNLPKGTE VPPLIKTTSP PSLSLEVTPP FPAVSPPSAS PVQTVTSAEE 840 

SSADVPLLGE EEHVLGTISS ASMGLEHNHN GVILVEPEVT STPIiEEWDD LSEKTEEITS 90 0 

TEGDL KGTAA PTLISEPYEP SPTLHTLDTV YEKPTHEETA TEGWSAADVG SSPEPTSSEY 960 

EPPLDAVSLA ESEPMQYFDP DLETKSQPDE DKMKEDTFAH LTPTPTIWVN DSSTSQLFED 102 0 

STIGEPGVPG QSHLQGLTDN IHLVKSSLST QDTLLIKKGM KEMSQTLQGG NMLEGDPTHS 1080 

15 RSSESEGQES KSITLPDSTL GIMSSMSPVK KPAETTVGTL LDKDTTTVTT TPRQKVAPSS 1140 

TMSTHPSRRR PNGRRRLRPN KFRHRHKQTP PTTFAPSETF STQPTQAPDI KISSpVESSL 1200 

VPTAWVDNTV NTPKQLEMEK NAEPTSKGTP RRKHGKRPNK HRYTPSTVSS RASGSKPSPS 1260 

PENKHRNIVT PSSETILLPR TVSLKTEGPY DSLDYMTTTR KIYSSYPKVQ ETLPVTYKPT 1320 

SDGKEIKDDV ATNVDKHKSD ILVTGESITN AIPTSRSLVS TMGEFKEESS PVGFPGTPTW 1380 

20 NPSRTAQPGR LQTDIPVTTS GENLTDPPLL KELEDVDFTS EFLSSLTVST PFHQEEAGSS 144 0 

TTLSSIKVEV ASSQAETTTL DQDHLETTVA ILLSETRPQN HTPTAARMKE PASSSPSTIL 1500 

MSLGQTTTTK PALPSPRISQ ASRDSKENVF LNYVGNPETE ATPVNNEGTQ HMSGPNELST 1560 

PSSDRDAFNL STKLELEKQV FGSRSLPRGP DSQRQDGRVH ASHQLTRVPA KP I LPTATVR 162 0 

LPEMSTQSAS RYFVTSQSPR HWTNKPEITT YPSGALPENK QFTTPRLSST TIPLPLHMSK 1680 

25 PSIPSKFTDR RTDQFNGYSK VFGNNN I PEA RNPVGKPPSP RIPHYSNGRL PFFTNKTLSF 1740 

PQLGVTRRPQ IPTSPAPVMR ERKVI PGSYN RIHSHSTFHL DFGPPAPPLL HTPQTTGSPS 1800 

TNLQNIPMVS STQSSISFIT SSVQSSGSFH QSSSKFFAGG PPASKFWSLG EKPQILTKSP 1860 

QTVSVTAETD TVFPCEATGK PKPFVTWTKV STGALMTPNT RIQRFEVLKN GTLVIRKVQV 1920 

QDRGQYMCTA SNLHGLDRMV VLLSVTVQQP QILASHYQDV TVYLGDT I AM ECLAKGTPAP 1980 

30 QISWIFPDRR VWQTVSPVES R I TLHENRTL SIKEASFSDR GVYKCVASNA AGADSLAIRL 2 040 

HVAALPPVIH QEKLENISLP PGLSIHIHCT AKAAPLPSVR WVLGDGTQIR PSQFLHGNLF 2100 

VFPNGTLYIR NLAPKDSGRY ECVAANLVGS ARRTVQLNVQ RAAANARITG TSPRRTDVRY 2160 

GGTLKLDCSA SGDPWPRIIjW RLPSKRMIDA LFSFDSRIKV FANGTLWKS VTDKDAGDYL 222 0 

CVARNKVGDD YWLKVDWM KPAKIEHKEE NDHKVFYGGD LKVDCVATGL PNPEISWSLP 22 80 

35 DGSLVNSFMQ SDDSGGRTKR YWFNNGTLY FNEVGMREEG DYTCFAENQV GKDEMRVRVK 2340 

WTAPATIRN KTYLAVQVPY GDWTVACEA KGEPMPKVTW LSPTNKVIPT SSEKYQIYQD 2400 

GTLLIQKAQR SDSGNYTCLV RNSAGEDRKT WIHVNVQPP KINGNPNPIT TVREIAAGGS 2460 

RKLIDCKAEG IPTPRVLWAF PEGWIiPAPY YGNRITVHGN GSLDIRSLRK SDSVQLVCMA 252 0 

RNEGGEARL I VQLTVLEPME KPIFHDPISE K I TAMAGHT I SLNCSAAGTP TPSLVWVLPN 2580 

40 GTDLQSGQQL QRFYHKADGM LHISGLSSVD AGAYRCVARN AAGHTERLVS LKVGLKPEAN 2640 

KQYHNLVS I I NGETLKLPCT PPGAGQGRFS WTLPNGMHLE GPQTLGRVSL LDNGTLTVRE 2700 

ASVFDRGTYV CRMETEYGPS VTSIPVIVIA YPPRITSEPT PVIYTRPGNT VKLNCMAMGI 2760 

PKADITWELP DKSHLKAGVQ ARLYGNRFLH PQGSLTIQHA TQRDAGFYKC MAKNILGSDS 2 820 
KTTYIHVF 

45 
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ATGCCAGGCA CAAAACTAAC CCGAACAGGC GCCCCAGCAG ACTACAGAGT GATATTGAAG 60 

ACCT CTCAAG AGGACGAATT GGATGTACCT GACGACATCA GCGTCCGGGT TATGTCATCT 12 0 

CAGTCTGTGC TTGTGTCCTG GGTGGATCCT GTTCTGGAAA AACAGAAGAA AGTTGTTGCA 180 

55 TCAAGACAGT ACACCGTGCG CTATCGAGAG AAGGGGGAAT TGGCCAGGTG GGATTATAAG 240 

CAGATCGCTA ACAGGCGTGT GCTGATTGAG AACCTGATTC CAGACACTGT GTATGAATTT 3 00 

GCAGTCCGTA TTTCACAGGG TGAAAGAGAT GGCAAATGGA GTACGTCAGT CTTCCAAAGA 360 

ACACCAGAAT CTGCCCCTAC CACAGCTCCT GAAAACTTGA ACGTCTGGCC AGTCAATGGC 420 

AAACCTACAG TTGTCGCTGC ATCTTGGGAT GCGCTACCAG AGACTGAGGG GAAAGTGAAA 480 

60 GTCTGTCTGC TGGACACAGG ACTGTTTTCA GTTTCCTCCT TCCAACCATC TGCCAAATCA 540 

TT TCAGAAT A CATTCTTTCA TACGCCCCGG CTCTCAAACC ATTTGGAGCA AAGTCCCTCA 600 

CCTATCCTGG AGACACTACT TCTGCCCTGG TGGATGGTCT GCAGCCTGGG GAACGCT AT C 660 

TTTTCAAAAT CCGGGCCACA AACAGGAGAG GCCTGGGACC TCACTCCAAA GCCTTCATTG 720 

TCGCTATGCC AACAAGAATG CAGCTGTACC CAGAAGGATT TCAGTTGTCT AGCTTACCTG 780 

65 ATCGATATCC AAACCAAACA AGTTAATAAA GATCCACAAC TGGAAGGGAG TGTTTTTGGA 840 

CCATGTTTTC TTTTCTACTT CCTCACATTT ATGCTGGATA TTGGCGGCTT TTCCTTCATT 900 

ATGTGCTATG AAGACCCANN TGTTTCTTCT TTGACAGGCA ATTCTTTAAA ATCTGTTGCA 960 

GCCAGTAAGG CGGATGTTCA GCAGAACACG GAGGACAATG GGAAACCCGA AAAACCTGAG 102 0 

CCTTCCTCAC CTTCTCCCAG AGCTCCAGCT TCCTCCCAAC ACCCCTCTGT GCCTGCTTCT 1080 

70 CCCCAAGGGA GAAATGCCAA GGACCTTCTT CTTGACTTGA AGAACAAAAT ATTGGCTAAT 1140 

GGTGGGGCGC CCCGAAAACC CCAGCTTCGC GCCAAGAAGG CAGAGGAGCT GGATCTTCAG 1200 

TCGACAGAAA TCACTGGGGA GGAGGAGCTG GGTTCCCGGG AGGACTCGCC CATGTCACCC 1260 

TCAGACACCC AAGACCAGAA ACGGACCCTG AGGCCGCCAA GTAGACACGG CCACTCGGTG 132 0 

GTTGCTCCCG GCAGGACTGC AGTGAGGGCC CGGATGCCAG CGCTGCCCCG AAGGGAAGGC 13 8 0 

75 GTAGATAAGC CTGGCTTTTC CCTGGCCACG CAGCCCCGCC CAGGGGCGCC CCCCTCGGCT 1440 

TCGGCCTCTC CTGCCCACCA CGCGTCCACC CAGGGCACCT CTCATCGTCC TTCCCTGCCT 1500 

GCCAGCTTGA ATGACAACGA CTTGGTGGAC TCAGACGAAG ATGAGCGCGC TGTGGGCTCC 1560 

CTCCACCCCA AGGGCGCCTT CGCCCAGCCC CGGCCAGCCC TGTCCCCCAG CCGCCAGTCC 1620 

CCGTCCAGCG TTCTCCGCGA CAGAAGCTCT GTGCACCCCG GCGCAAAGCC AGCCTCGCCG 1680 

80 GCGCGGAGGA CCCCCCATTC AGGGGCCGCA GAGGAAGATT CCAGTGCCTC AGCCCCACCC 1740 

TCAAGACTTT CTCCACCCCA TGGGGGATCA TCTCGGCTGC TGCCCACCCA GCCACACCTG 1800 

AGCTCTCCAC TTTCCAAGGG CGGGAAGGAT GGTGAGGACG CCCCAGCCAC CAACTCCAAT 1860 

GCGCCATCAC GGTCCACCAT GTCCTCCTCC GTCTCTTCTC ATCTCTCGTC CAGGACGCAG 1920 

GTCTCTGAGG GAGCGGAGGC TTCTGATGGT GAAAGCCACG GTGACGG CGA TAGGGAAGAC 1980 

85 GGCGGAAGGC AGGCGGAGGC CACGGCCCAG ACGCTGCGGG CCCGGCCTGC CTCTGGACAC 2040 

TTCCATTTGC TCAGACACAA ACCCTTTGCT GCCAACGGGA GGTCTCCAAG CAGGTTCAGC 2100 

ATTGGGCGGG GACCTCGGCT GCAGCCCTCC AGCTCCCCAC AGTCGACTGT GCCCTCCCGA 2160 
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GCCCACCCCA GGGTTCCCTC T C ACT CTGAT TCCCACCCTA AGCTTAGCTC AGGTATCCAT 222 0 

GGAGACGAGG AGGATGAGAA GCCGCTTCCT GCCACCGTTG TCAATGACCA CGTGCCTTCC 2280 

TCCTCCAGGC AGCCCATCTC CCGGGGCTGG GAGGACTTAA GGAGAAGCCC GCAGAGAGGG 2340 

GCCAGCCTGC ATCGGAAGGA ACCCATCCCA GAGAACCCCA AATCCACAGG GGCAGATACA 2400 

5 CATCCTCAGG GCAAGTACTC CTCCCTGGCC TCCAAGGCTC AGGATGTTCA ACAGAGCACA 2460 

GACGCGGACA CGGAGGGTCA TTCTCCCAAA GCACAGCCAG GGTCCACAGA CCGCCACGCG 252 0 

TCCCCTGCTC GTCCTCCCGC AGCACGGTCA CAGCAGCATC CCAGTGTTCC CAGAAGGATG 2580 

ACACCCGGCC GGGCCCCAGA ACAGCAGCCC CCTCCTCCCG TCGCCACGTC CCAGCACCAC 2640 

CCGGGACCCC AGAGCAGAGA CGCGGGTCGG TCACCTTCCC AGCCCAGGCT CTCACTGACC 2700 

10 CAGGCCGGGC GGCCCCGCCC CACGTCGCAG GGCCGCTCCC ACTCCTCCTC GGACCCTTAC 2760 

ACGGCGAGCT CCAGAGGGAT GCTCCCCACG GCCCTCCAGA ACCAGGACGA GGATGCCCAG 2820 

GGCAGCTACG ACGACGACAG CACAGAAGTC GAGGCCCAGG ATGTGCGGGC CCCCGCGCAC 2880 

GCCGCGCGCG CCAAGGAGGC AGCTGCGTCC CTTCCCAAGC ACCAGCAGGT GGAGTCTCCC 2940 

ACAGGCGCAG GGGCAGGTGG CGACCACAGG TCCCAGCGCG GACATGCGGC CTCCCCCGCC 3000 

15 AGGCCCAGCC GACCCGGCGG CCCCCAGTCC CGCGCCCGGG TCCCCAGCAG GGCAGCGCCG 3060 

GGGAAGTCGG AGCCTCCTTC CAAGCGGCCC CTGTCCTCCA AGTCCCAGCA GTCGGTCTCA 3120 

GCCGAGGACG AGGAGGAGGA GGACGCGGGG TTTTTTAAAG GCGGGAAAGA AGACCTTCTG 3180 

TCTTCCTCTG TGCCAAAGTG GCCCTCTTCC TCCACTCCCA GGGGCGG CAA AGACGCCGAT 3240 

GGGAGCCTCG CCAAGGAAGA GAGGGAGCCT GCCATCGCGC TTGCCCCTCG CGGAGGGAGC 3300 

20 CTGGCTCCTG TGAAGCGACC TCTCCCCCCA CCTCCAGGCA GCTCCCCCAG GGCCTCCCAC 33 60 

GTCCCTTCCC GACCGCCGCC TCGCAGCGCT GCCACCGTGA GCCCCGTCGG GGGCACCCAC 3420 

CCCTGGCCGC GGTACACCAC GCGCGCCCCV CCTGGCCACT TCTCCACCAC CCCGATGCTG 3480 

TCCTTGCGCC AGAGGATGAT GCATGCCAGA TTCCGTAACC CTCTCTCCCG ACAGCCTGCG 3540 

AGACCCTCTT ACAGACAAGG TTATAATGGC AGACCAAATG TAGAAGGGAA AGTCCTTCCT 3600 

25 GGTAGTAATG GAAAACCGAA TGGACAGAGA ATTATCAATG GCCCTCAAGG AACAAAGTGG 3 660 

GTTGTGGACC TTGATCGTGG GTTAGTATTG AATGCAGAAG GAAGGTACCT CC AAGATT C A 372 0 

CATGGAAATC CTCTTCGGAT TAAACTAGGA GGAGATGGTC GAACCATTGT AGATCTGGAA 3780 

GGGACCCCCG TGGTGAGTCC TGACGGCCTC CCACTCTTTG GGCAGGGGCG ACATGGCACA 3840 

CCTCTGGCCA ATGCCCAAGA TAAGCCAATT TTGAGTCTTG GAGGAAAGCC GCTGGTGGGC 3 900 

30 TTGGAGGTCA TCAAAAAAAC CACCCATCCC CCTACCACTA CCATGCAGCC CACCACTACT 3960 

ACGACGCCCC TGCCTACCAC TACAACCCCG AGGCCCACCA CTGCCACCAC CATGCAGCCC 402 0 

ACCACTACTA CGACGCCCCT GCCTACCACT ACACCGAGGC CCACCACTGC CACCACCCGC 40 80 

CGCACGACCA CCAGGCGTCC AACAACCACA GTCCGAACCA CTACGCGGAC AACCACCACC 4140 

ACCACCCCCA AACCCACCAC TCCCATCCCC ACCTGTCCCC CTGGGACCTT GGAACGGCAC 420 0 

35 GACGATGATG GCAACCTGAT AATGAGCTCC AATGGGATCC CAGAGTGCTA CGCTGAAGAA 42 60 

GATGAGTTCT CAGGCTTGGA GACTGACACT GCAGTACCTA CGGAAGAGGC CTACGTTATA 432 0 

TATGATGAAG ATTATGAATT TGAGACGTCA AGGCCACCAA CCACCACTGA GCCTTCGACC 4380 

ACTGCTACCA CACCGAGGGT GATCCCAGAG GAAGGCGCCA TCAGTTCCTT TCCTGAAGAA 4440 

GAATTTGATC TGGCTGGAAG GAAACGATTT GTTGCTCCTT ACGTGACGTA CCTAAATAAA 4500 

40 GACCCATCAG CCCCGTGCTC TCTGACTGAT GCACTGGATC ACTTCCAAGT GGACAGCCTG 4560 

GATGAAATCA TCCCCAATGA CCTGAAGAAG AGTGATCTGC CTCCCCAGCA TGCTCCCCGC 462 0 

AACATCACCG TGGTGGCCGT GGAAGGTTGC CACTCATTTG TCATTGTGGA TTGGGACAAA 4680 

GCCACCCCAG GAGATTTGGT CACAGGTTAT TTGGTTTACA GTGCATCCTA TGAAGATTTC 4740 

ATCAGGAACA AGTTTTCCAC TCAAGCTTCA TCAGTAACTC ACTTGCCCAT TGAGAACCTA 4800 

45 AAGCCCAACA CGAGGTATTA TTTTAAAGTG CAAGCACAAA ATCCTCATGG CTACGGACCT 4860 

ATCAGCCCTT CGGTCTCATT TGTCACCGAA TCAGATAATC CTCTGCTTGT TGTGAGGCCC 4920 

CCAGGCGGTG AGCTATCTGG ATCCCATTCG CTTTCAAACA TGATCCCAGC TACACGGACT 4 980 

GCCATGGACG GCAATATGTG AAGCGCACGT GGTATCGAAA GTTCGTGGGA GTTGTTCTTT 5040 

GTAATTCACT GAGGTATAAA ATCTACCTCA GTGACAACCT GAAAGATACA TTCTACAGCA 510 0 

50 TTGGAGACAG CTGGGGAAGA GGTGAAGACC ATTGCCAATT TGTGGATTCA CACCTTGATG 5160 

GAAGAACAGG GCCTCAGTCC TATGTAGAAG CCCTCCCTAC TATTCAAGGC TACTATCGCC 5220 

AGT AT CGTC A GGAGCCTGTC AGGTTTGGGA ACATCGGCTT CGGAACCCCC TACTACTATG 5280 

TGGGCTGGTA CGAGTGTGGG GTCTCCATCC CTGGAAAGTG GTAATCACAG GACCGTCATG 5340 

CTGCAAGCTT GCCCTGCCCA GCCCCACCAA CTAAGTCGCA CTAGGGGCTG TGAGCAAAGA 5400 

55 CAGCCAGCAT GCTCAGCCCC GCTGCCCTAG GTGCCAGGAA GGTCACAGAT GGACACTGGC 5460 

CATTCTGGTC ATCTCAGTCT GGAACTCAGT CCCACTTCTT GGCCTGGACA ATGAACAGGA 5520 

TTCAGTTTTG CTGTTAACTT TGCTTCTCTA CTTTTTTTTG TTTGTTTGTA ATAGCACATC 5580 

CCAGAGACAT CAGAAACCAG CAACTGATTC AGTGTGATTT CCCAGACTTT TTAGGCATGA 5640 

AATTCGGACA CTTCAGTATT TCCAGGAATA GCATATGCAC GCTGTTCTTG CTTCATGGAA 57 0 0 

60 "TGCTACATGC TTTCTGTTTT TCTCATTTTG GATTTCTCCA AAACTAACTG AATTTAAGCT 5760 

TCAGGTCCCT TTGTATG CAG TAGAAAGGAA TTATTAAAAA CACCACCAAA GAAAATAAAT 5820 

ATATCCTACT TGAAATTTAC TCTATGGACT TACCCACTGG TAGAATAAAT GTATCAAATC 5880 

TTATTTGTAA ATTCTCAATT TTGATATATA TATGTATATA TGCATATACA TATCCACACT 5 940 

TGT CTGCAAG AATATTGATT AAAATTGCTA AATTTGTACT TGTTCACCAA AAAAAAAAAA 6000 
65 AAAAAAA 

Seq ID NO: 419 Protein sequence 
Protein Accession #: Eos sequence 

70 1 11 21 31 41 51 

I I I I I I 

MPGTKLTRTG APADYRVILK TSQEDELDVP DDISVRVMSS QSVLVSWVDP VLEKQKKWA 60 

SRQYTVRYRE KGELARWDYK QIANRRVLIE NL I PDTVYEF AVRISQGERD GKWSTSVFQR 12 0 

TPESAPTTAP ENLNVWPVNG KPTWAASWD ALP ETEGKVK VCLLDTGIjFS VSSFQPSAKS 180 

75 FQNTFFHTPR LSNHLEQSPS PILETLLLPW WMVCSLGNAI FSKSGPQTGE AWDLTPKPSL 240 

SLCQQECSCT QKDFSCLAYL IDIQTKQVNK DPQLEGSVFG PCFLFYFLTF MLDIGGFSFI 300 

MCYEDPVSSL TGNS LKS VAA SKADVQQNTE DNGKPEKPEP SSPSPRAPAS SQHPSVPASP 3 60 

QGRNAKDLLL DLKNKILANG GAPRKPQLRA KKAEELDLQS TEITGEEELG SREDSPMSPS 420 

DTQDQKRTLR PPSRHGHSW APGRTAVRAR MPALPRREGV DKPGFSLATQ PRPGAPPSAS 480 

80 ASPAHHASTQ GTSHRPSLPA SLNDNDLVDS DEDERAVGSL HPKGAFAQPR PALSPSRQSP 540 

SSVLRDRSSV HPGAKPASPA RRTPHSGAAE EDSSASAPPS RLSPPHGGSS RLLPTQPHLS 600 

SPLSKGGKDG EDAPATNSNA PSRSTMSSSV SSHLSSRTQV SEGAEASDGE SHGDGDREDG 660 

GRQAEATAQT LRARPASGHF HLLRHKPFAA NGRSPSRFSI GRGPRLQPSS SPQSTVPSRA 72 0 

HPRVPSHSDS HPKLSSGIHG DEEDEKPLPA TWNDHVPSS SRQPISRGWE DLRRSPQRGA 780 

85 SLHRKEPIPE NPKSTGADTH PQGKYSSLAS KAQDVQQSTD ADTEGHSPKA QPGSTDRHAS 840 

PARPPAARSQ QHPSVPRRMT PGRAPEQQPP PPVATSQHHP GPQSRDAGRS PSQPRLSLTQ 900 

AGRPRPTSQG RSHSSSDPYT ASSRGMLiPTA LQNQDEDAQG SYDDDSTEVE AQDVRAPAHA 960 



342 



WO 02/086443 



PCT/US02/12476 



10 



ARAKEAAASL 
KSEPPSKRPL 
SLAKEEREPA 
WPRYTTRAPP 
SNGKPNGQRI 
TPWSPDGLP 
TPLPTTTTPR 
TPKPTTPIPT 
DEDYEFETSR 
PSAPCSLTDA 
TPGDLVTGYL 
SPSVSFVTES 



PKHQQVESPT 
SSKSQQSVSA 
IALAPRGGSL 
GHFSTTPMLS 
INGPQGTKWV 
LFGQGRHGTP 
PTTATTMQPT 
CPPGTLERHD 
PPTTTEPSTT 
LDHFQVDSIiD 
VYSASYEDFI 
DNPLLWRPP 



GAGAGGDHRS 
EDEEEEDAGF 
APVKRPLPPP 
LRQRMMHARF 
VDLDRGLVLN 
LANAQDKPIL. 
TTTTPLPTTT 
DDGNLIMSSN 
ATTPRVI PEE 
EIIPNDLKKS 
RNKFSTQASS 
GGELSGSHSL 



QRGHAASPAR 
FKGGKEDLLS 
PGSSPRASHV 
RNPLSRQPAR 
AEGRYLQDSH 
SLGGKPLVGL 
PRPTTATTRR 
GIPECYAEED 
GAISSFPEEE 
DLPPQHAPRN 
VTHLPIENLK 
SNMIPATRTA 



PSRPGGPQSR 
SSVPKWPSSS 
PSRPPPRSAA 
PSYRQGYNGR 
GNPLRIKLGG 
EVIKKTTHPP 
TTTRRPTTTV 
EFSGLETDTA 
FDLAGRKRFV 
I TWAVEGCH 
PNTRYYFKVQ 
MDGNM 



ARVPSRAAPG 1020 

TPRGGKDADG 10 80 

TVSPVAGTHP 1140 

PNVEGKVLPG 1200 

DGRTIVDLEG 1260 

TTTMQPTTTT 1320 

RTTTRTTTTT 1380 

VPTEEAYVIY 1440 

APYVTYLNKD 1500 

SFVIVDWDKA 1560 

AQNPHGYGPI 1620 



15 



Seq ID NO: 420 DNA sequence 

Nucleic Acid Accession #: NM_022743 

Coding sequence: 128.. 1237 



20 



25 



30 



35 



40 



45 



50 



55 



GTGGATTTTA 
TCTCTGCTGC 
AAAGCTGATG 
AAAAGCTTGG 
TCCTCCAGAC 
TTCAGAATCA 
TGAAGATAAG 
AGAAATACAG 
AGTGATCTGC 
AT AT CCCAGT 
TGGGCCCCAC 
CTGCTACCTG 
CTGCTTTGAA 
TGGTGATGAG 
GGCACACTGG 
TGAACGGCTT 
CTG CAT CAAC 
ATACAGGATT 
CAAACTGCAG 
TGATATTATG 
TTTAGAAGAA 
CGGCGTGTGT 
GTGAACCTCT 
GGTTTGCAAA 
ATTTGGTTGA 



11 
I 

GAGATACCTC 
AACACCCCTA 
CGATGCTCTC 
CCAGACCACA 
TCCGTTCGAC 
GAGAAGCTTT 
AAAGAGGGCC 
GATGCCTCTC 
AACTCTTTCA 
ATCTCTTTGC 
CTCTTACTGC 
GAT ATG CTG A 
TGTGACTGTT 
CAAGTATGGA 
AAGTGGGAGC 
CCCGATATCA 
CTCGGCCTGT 
TTTTTCCCAG 
CTACATCAAG 
AGAGTGACAC 
TGCGACGCCA 
CTTTGTTGAA 
CTTATTGGAA 
CCACAAGAAT 
GGATGCCAAA 



21 

I 

CCCTCCTTCT 
CTGTTCTCCG 
AGTGCCGCGT 
AGCGGGAATG 
TTCTTGGCAG 
ACTCATTTTA 
TCAGGCAACT 
AGCTGCCACC 
CCATCTGTAA 
TCAATCACAG 
GAGCAGTCCG 
TGACCAGTGA 
TCCGTTGCCA 
AGGAAGTTCA 
AGGTTCTGGC 
ACATCTACCA 
TGGAGGAAGC 
GAAGCCATCC 
GCATGTTTCC 
ATGGCAGAGA 
ACATCAGAGC 
TGCCTTATTG 
ATTCTGTTCC 
CATTAGTTGT 
AAAAAAAAAA 



31 
I 

GCTCAGCTGC 
TGTATTGGCT 
CGCCAAATAC 
CAAATGCCTT 
AGTTGTCTTC 
TGATCTGGAG 
CGTAATGACA 
TGCCTTTGAC 
TGCGGAGATG 
CTGTGACCCC 
AGACATCGAG 
GGAGCGCCGG 
AACCCAGGAC 
AGAAT CCCTG 
CATGTGCCAG 
GCTGAAGGTG 
CTTGTTCTAT 
CGTCAGAGGG 
CCAAGCAATG 
ACACAGCCTG 
ATCCTAAGGG 
AGGTCACACA 
' GTGTTTGTGT 
AGAGAAGCAC 
AAAAAAA 



41 

i 

CTTGCAGTAA 
TTTCTGGGCA 
TGTAGTGCTA 
AAAAGCTGCA 
AAACTTATGG 
TCAAATATTA 
TTTCAACATT 
CTTTTTGAAG 
CAGGAAGTTG 
AACTGTTCGA 
GTGGGAGAGG 
AAGCAGCTGA 
AAGGATGCTG 
AAAAAAATTG 
GCGATCATAA 
CTCGACTGCG 
GGTACTCGGA 
GTTCAAGTGA 
AAGAAT CTGA 
ATTGAAGATT 
AACGCAGTCA 
CTCTATGCTT 
AGGTAAATAA 
GATTATAATA 



51 
I 

TTAAACTCTT 
GCAGGAAGGA 
AGTGT CAGAA 
AACCCAGATA 
ATGGAGCACC 
ACAAACTGAC 
TCATGAGAGA 
CCTTTGCAAA 
GTGTTGGCCT 
TTGTGTTCAA 
AGCTCACCAT 
GGGACCAGTA 
ATATGCTAAC 
AAGAACTGAA 
GCAGCAATTC 
CCATGGATGC 
CCATGGAGCC 
TGAAAGTTGG 
GACTGGCTTT 
TGATTCTACT 
GAGGGAAATA 
TGTTAGCTGT 
AGGCAGACAT 
AATTCAAAAC 



Seq ID NO: 421 Protein sequence 
Protein Accession #: NP_073580



MRCSQCRVAK 
SEKLYSFYDL 
CNSFTI CNAE 
LDMLMTSEER 
WKWEQVLAMC 
IFFPGSHPVR 
ECDANIRAS 



11 

I 

YCSAKCQKKA 
ESNINKLTED 
MQEVGVGLYP 
RKQLRDQYCF 
QAIISSNSER 
GVQVMKVGKL 



21 



WPDHKRECKC 
KKEGLRQLVM 
SISLLNHSCD 
ECDCFRCQTQ 
LPDINIYQLK 
QLHQGMFPQA 



31 
I 

LKSCKPRYPP 
TFQHFMREEI 
PNCSIVFNGP 
DKDADMLTGD 
VLDCAMDACI 
MKNLRLAFDI 



41 

I 

DSVRLLGRW 
QDASQLPPAF 
HLLLRAVRDI 
EQVWKEVQES 
NLGLLEEALF 
MRVTHGREHS 



51 
I 

F KLMD GAP S E 
DLFEAFAKVI 
EVGEELTICY 
LKKIEELKAH 
YGTRTMEPYR 
IiIEDLIIiLIiE 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 



60 
120 
180 
240 
300 
360 



60 



Seq ID NO: 422 DNA sequence 

Nucleic Acid Accession #: NM_003014.2

Coding sequence: 238.. 648 



65 



70 



75 



80 



85 



GGCGGGTTCG 
CGGAGCTCCG 
AAACTCTCCT 
GGCAGGAAGA 
TTCCTCTCCA 
GCGCCCTGCG 
ATGCCCAACC 
GAGGAGCTGG 
GCGCCCATTT 
CAACGCGCGC 
AGCCTGGCCT 
ATCGTCACGG 
CAGGAAAGGC 
AAGGTGAAGC 
AAAATAAAAG 
GAGAT CTTCA 
TCTTGCCAGT 
CGTTCAAGGA 
AAAAGATCCA 
AAGAAAACAG 
GCTCCCAAAC 
. AACCCGAAAA 
' GATGAGGCTG 



11 
I 

CGCCCCGAAG 
CGGCCGGACC 
GCGCCCCAGA 
GAAGGCGCTT 
TCCTAGTGGC 
AGGCGGTGCG 
ACCTGCACCA 
TGGACGTGAA 
GCACCCTGGA 
GCGACGACTG 
GCGACGAGCT 
ACCTCCCGGA 
CTCTTGATGT 
CAACTTTGGC 
CTGTGCAGAG 
AGTCCTCATC 
GTCCACACAT 
TGATGCTTCT 
TACAGTGGGA 
CCGGGCGCAC 
CAGCCAGTCC 
GAGTGTGAGC 
GGCATTGCCT 



21 



GCTGAGAGCT 
CCGCGGCCCC 
AGATTTCTTC 
TCTGTCTGCC 
GCTGTGCCTG 
CATCCCTATG 
CAGCACGCAG 
CTGCAGCGCC 
GTTCCTGCAC 
CGAGCCCCTC 
GCCTGTCTAT 
GGATGTTAAG 
TGACTGTAAA 
AACGTATCTC 
GAGTGGCTGC 
ACCCATCCCT 
CCTGCCCCAT 
TGAAAATTGC 
AGAGAGGCTG 
CAGT CGTAGT 
CAAGAAGAAC 
TAACTAGTTT 
GGGACAGCCT 



31 
1 

GGCGCTGCTC 
GCTTTGCTGC 
CTCGGCGAAG 
GGGGTCGCAG 
TGGCTGCACC 
TGCCGGCACA 
GAGAACGCCA 
GTGCTGCGCT 
GACCCTATCA 
ATGAAGATGT 
GACCGTGGCG 
TGGATAGACA 
CGCCTAAGCC 
AGCAAAAACT 
AATGAGGTCA 
CGAACT CAAG 
CAAGATGTTC 
TTAGTTGAAA 
CAGGAACAGC 
AATCCCCCCA 
ATTAAAACTA 
CCAAAGCGGA 
ATGTAAGGCC 



41 

1 

GTGCCCTGTG 
CGACTGGAGT 
GGACAGCGAA 
CGCGAGAGGG 
TGGCGCTGGG 
TGCCCTGGAA 
TCCTGGCCAT 
TCTTCTTCTG 
AGCCGTGCAA 
ACAACCACAG 
TGTGCATTTC 
TCACACCAGA 
CCGATCGGTG 
ACAGCTATGT 
CAACGGTGGT 
TCCCGCTCAT 
TCATCATGTG 
AATGGAGAGA 
GGAGAACAGT 
AACCAAAGGG 
GGAGTGCCCA 
GACTTCCGAC 
ATGTGCCCCT 



51 

1 

TGCCAGACGG 60 

TTGGGGGAAG 120 

AGATGAGGGT 180 

CAGTGCCATG 24 0 

CGTGCGCGGC 300 

CATCACGCGG 360 

CGAG CAGT AC 420 

TGCCATGTAC 480 

GTCGGTGTGC 54 0 

CTGG CCCGAA 600 

GCCTGAAGCC 660 

CATGATGGTA 720 

CAAGTGTAAA 780 

TATTCATGCC 840 

GGATGTAAAA 900 

TACAAATTCT 960 

TTACGAGTGG 1020 

TCAGCTTAGT 1080 

TCAGGACAAG 1140 

AAAGCCTCCT 1200 

GAAGAG AACA 12 60 

TTCCTTACAG 1320 

TGCCCTAACA 1380 



343 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



WO 02/086443 

ACTCACTGCA GTGCTCTTCA 
GTTTTTCTTT GTAAGCCATC 
GAGTTAAAGC TGGTGGAAAA 
CTAGAAGAGT AGGGAAAATA 
AAATGCCATA TTTCAAACAA 
TATCTGTTGT TGCAATGTTA 
AAGGAACAGT AGTGGAATGA 
TTTTTGTGAT GAAAGGGGAT 
TGTGTTTTTT TACCAATGAC 
AATAATAAAG AAAAATAAAT 
GTTACCTGAT TTCCATGATC 
ACAGTGAGTT TGTCTGTACC 
ATTTTATACC CACAAGAGAG 
AATAATTTGA CAAGCTTAAA 
TTAAATATTT TCTTTGCCTA 
AAAGTTGAGT TCCACCTCTG 
AAAAAGAACT TATTTGCAGC 
ATTTATTTTA AAAAACAATT 
AGGCATTCAA TAAATGCACA 
ACTACACAGA GGTAATCACT 
GCACTTATAA AATGATTTGA 
CTGCCTCCTT TGCTTGGCCC 
TCTCATTTCT AACAGCTGTG 
TATTGGATAC TTAGGTGGTT 



PCT/US02/12476 



TAGACACATC 
ACAAGCCATA 
GGCTTATTGC 
ATGCTTGTTA 
AACACGTAAT 
GTGATGTTTT 
ATGTTAAAAG 
TTTTTGAAAA 
TTCAGTTTCT 
AAAAAGGAGA 
ATGATGCTTC 
ATTAGGAGTT 
GTATGTCACT 
AATGGCCTTC 
AATACATGTG 
AAATGAGAAT 
ATTTTATCAA 
TTATTGGCCT 
ACGCCCAAAG 
ATTAGTATTT 
ACAAATAAAA 
TTTATTGAGA 
TTATATTCCA 
TCTTCACTGA 



TTGCAGCATT 
GTGGTAGGTT 
ATTGCATTCA 
CAATTCGACC 
TTTTTTACAG 
AAAATGTGAT 
ATCTTTATGT 
ATTAGAGAAG 
GTTTTTAGCT 
GGCAGACAAT 
TTGTCAACAC 
AGGTACTAAT 
CATCTTACTT 
ATGTGAGTGC 
AGAGGAGTTA 
TACTTGACAG 
CAAATTTCAT 
TTTGCTAACA 
GAAATAAAAT 
TGGCATATTA 
CTAGGAACCT 
TAAGTTTTCC 
TAGTATGCAT 
CAATACTGAA 



TTT CTTAAGG 
TGCCCTTTGG 
GAGTAACCTG 
TAATATGTGC 
TATGTTTTAT 
GAAAATATAA 
GTTTATGGTC 
TAGCATATGG 
AGAAACTTAA 
GTCTGGATTC 
CCTCTTAAGC 
TAGTTGGCTA 
CCCAGGACAT 
CAAATTTTGT 
AATATAAATG 
TTGGGATACT 
AATTGTGGAC 
CAGTAAGCAT 
CCTATCTAAT 
TTCTCCAGGT 
GTATACATGT 
TGTCAAGAAA 
TACTCAACAA 
TAAACATCTC 



Seq ID NO: 423 Protein sequence 
Protein Accession #: NP_003005.1



11 



21 



MFLSILVALC 
YEELVDVNCS 
ESLACDELPV 
KKVKPTLATY 
SSCQCPHILP 
KKKTAGRTSR 



LWLHLALGVR 
AVLRFFFCAM 
YDRGVCISPE 
LSKNYSYVIH 
HQDVLIMCYE 
SNPPKPKGKP 



GAPCEAVRIP 
YAPICTLEFL 
AIVTDLPEDV 
AKIKAVQRSG 
WRSRMMLLEN 
PAPKPASPKK 



31 
I 

MCRHMPWNIT 
HDPIKPCKSV 
KWIDITPDMM 
CNEVTTWDV 
CLVEKWRDQIi 
NIKTRSAQKR 



41 



RMPNHLHHST 
CQRARDDCEP 
VQERPLDVDC 
KEIFKSSSPI 
SKRSIQWEER 
TNPKRV 



Seq ID NO: 424 DNA sequence 
Nucleic Acid Accession #: BC010423 
Coding sequence: 248.. 1780 



85 



CACAGCGTGG 

AGCTACGGCT 

CAAGTGCGAG 

TCTGCAGCCG 

TTCAACCATG 

GCTGCTACTG 

CGTGGTAACT 

CGGCGAGCAA 

ACTAGCGCTA 

GGAGCAGCCG 

GCAGGCGGAT 

GGCGCGGCTG 

ACTAGAAGAG 

CCCCAGCGTG 

CTCCCGCTCT 

GCAGCCACTG 

CATCCTCCAC 

GTGGCACATT 

CTCATACAAC 

CACTTTGGGC 

CAATGAGTTC 

CTCTGGGAAG 

ACTCTTGTTC 

GGCCCAGCAG 

CCGGAGGCTG 

GAGAGCCGAG 

AGAGCCCGAG 

TGAACTGCTG 

CAAACAGGCC 

CAATGGCATC 

CTAGGCCTGG 

ACACCCCCAT 

AACCCTTCTG 

CACTGTGTGT 

TGACTGTCCG 

AAGT G AACTG 

GTTTGGCGTG 

CAGACCCCAG 

CAGACCCAGG 

TCTCCTACCA 

GAGGCTTGAA 

ACATATTTTC 

ACTTTTAATT 

TTTTATTTTT 



11 
I 

GAAGCAGCTC 
GGGTGTGTAG 
AGGCAAGAAC 
GCTCCCAGGG 
CCCCTGTCCC 
CTGGCATCAT 
GTGGTGCTGG 
GTGGGGCAAG 
CTGCACTCCA 
CCGCCCCCAC 
GAGGG CGAGT 
CGGCTCCGAG 
GGCCAGGGCC 
ACCTGGGACA 
GCTGCCGTCA 
ACTTGTGTGG 
GTGTCCTTCC 
GGCAGAGAAG 
TGGACACGGC 
TTTCCCCCAC 
TCCTCAAGGG 
CAGGTGGACC 
TGCCTTCTGG 
ATGACCCAGA 
CATTCCCATC 
GGCCACCCTG 
GGCCGCAGTT 
TCTCCAGGCT 
ATGAACCATT 
TACAT CAATG 
CTCCTTCTGT 
TTCTTGCGGA 
TTCATCGGGA 
GTGCATGTGT 
TGGAGGGGTG 
TGGTGTATGT 
TGTGT CATGT 
AGCAGTATTA 
TGTGCGGGCA 
CTTCGGAGCC 
CTGTTACAGA 
TGTAAATATA 
TTTTTCTTTT 
ATTTTTTTTT 



21 
I 

TGGGGGAGCT 
AACGGGGCCG 
TCTGCAGCTT 
AGATCTCGGT 
TGGGAGCCGA 
TTACAGGCCG 
GCCAGGACGC 
TGGCATGGGC 
AATACGGGCT 
GCAACCCCCT 
ACGAGTGCCG 
TGCTGGTGCC 
TGACCCTGGC 
CGGAGGTCAA 
CCT CAGAGTT 
TGTCCCATCC 
TTGCTGAGGC 
GAGCTATGCT 
TGGATGGGCC 
TGACCACTGA 
ATT CTCAGGT 
TAGTGTCAGC 
TGGTGGTGGT 
AATATGAGGA 
ACACGGACCC 
ATAGTCTCAA 
ACTCCACGCT 
CTGGGCGGGC 
TTGTTCAGGA 
GGCGGGGACA 
TGACATGGGA 
AGATGCTCCC 
GGGCTCCACC 
GCCTGTGTGA 
ACTGTGTCCG 
GCCACGGGAT 
GGCTGTGTGT 
ATGATGCAGA 
TAGCTGGAGC 
ATGGGGGCAA 
AGCCCTCTGC 
CATGCGCCGG 
TTTTTTCTTG 
AGAGTTTGAG 



31 
I 

CGGAGCTCCC 
GGGCTGGGGC 
CCTGCCTTCT 
GGAACTT CAG 
GATGTGGGGG 
GTGCCCCGCG 
AAAACTGCCC 
TCGGGTGGAC 
TCATGTGAGC 
GGACGGCTCA 
GGTCAGCACC 
TCCCCTGCCC 
AGCCTCCTGC 
AGGCACAACG 
CCACTTGGTG 
TGGCCTGCTC 
CTCtGTGAGG 
CAAGTGCCTG 
TCTGCCCAGT 
GCACAGCGGC 
CACTGTGGAT 
CTCGGTGGTG 
GGTGCTCATG 
GGAGCTGACC 
CAGGAGCCAG 
GGACAACAGT 
GACCACGGTG 
CGAGGAGGAG 
GAATGGGACC 
CCTGGTCTGA 
GATTTTAGCT 
CATCCCACTG 
AATTGAGTCT 
GTGTTGACTG 
TGGTGTGTAT 
TTGAGTGGTT 
GACCTCTGCC 
GGTTGGAGGA 
TGGAATCTGC 
GTGTGAAGCA 
CCTCTGGTGG 
GAGCTTCTTG 
CCCTTTCCAT 
TCCAGCCTGG 



41 
I 

GATCACGGCT 
TGGGTCCCCT 
GGGTCAGTTC 
AAACGCTGGG 
CCTGAGGCCT 
GGTGAGCTGG 
TGCTTCTACC 
GCGGGCGAAG 
CCGGCTTACG 
GTGCTCCTGC 
TTCCCCGCCG 
TCACTGAATC 
ACAGCTGAGG 
TCCAGCCGTT 
CCTAGCCGCA 
CAGGACCAAA 
GGCCTTGAAG 
AGTGAAGGGC 
GGGGTACGAG 
ATCTACGTCT 
GTTCTTGACC 
GTGGTGGGTG 
TCCCGATACC 
CTGACCAGGG 
CCGGAGGAGA 
AGCTGCTCTG 
AGGGAGATAG 
GAAGATCAGG 
CTACGGGCCA 
CCCAGGCCTG 
CATCTTGGGG 
ACTGCTTGAC 
CTCCCACCAT 
ACTGTGTGTG 
TATGCTGTCA 
GCGTGGGCAA 
TGAAAAAGCA 
GAGAGGTGGA 
CTCCGGTGTG 
GCCAGTCCCT 
CCTCTGGGCC 
CAGGAATACT 
TAGTTGTATT 
ACGATATAGC 



CTATGCTTCA 


1440 


TACAGAAGGT 


1500 


TGTGCATACT 


1560 


ATTGTAAAAT 


1620 


TACCTTTTGA 


1680 


TGTTTTTAAG 


1740 


TGCAGAAGGA 


1800 


AAAATTATAA 


1860 


AAACAAAAAT 


1920 


CTGTTTTTTG 


1980 


AGCACCAGAA 


2040 


ATGCTCAAGT 


2100 


CCACCCTGAG 


2160 


TTTTCTTCAT 


2220 


TACAGAGAGG 


2280 


TTAATCAGAA 


2340 


AATTGGAGGC 


2400 


GTATTTTATA 


2460 


CCTACTCTCC 


2520 


GTTTGCTTAT 


2580 


GTTTCATAAC 


2640 


GCAGAAACCA 


2700 


ACTGTTGTGC 


2760 


ACCGG AATTC 




51 


- 


1 

QENAILAIEQ 


60 


LMKMYNHSWP 


12 0 


KRLSPDRCKC 


180 


PRTQVPLITN 


240 


LQEQRRTVQD 


300 


51 

i 




1 

TCTTGGGGGT 


60 


AGTGGAGACC 


120 


CTTATTCAAG 


180 


CAGTCTGCCT 


240 


GGCTGCTGCT 


300 


AGACCTCAGA 


360 


GAGGGGACTC 


420 


GCGCCCAGGA 


480 


AGGGCCGCGT 


540 


GCAACGCAGT 


600 


GCAGCTTCCA 


660 


CTGGTCCAGC 


720 


GCAGCCCAGC 


780 


CCTTCAAGCA 


840 


GCATGAATGG 


900 


GGATCACCCA 


960 


ACCAAAATCT 


1020 


AGCCCCCTCC 


1080 


TGGATGGGGA 


1140 


GCCATGTCAG 


1200 


CCCAGGAAGA 


1260 


TGATCGCCGC 


1320 


AT CGGCGCAA 


1380 


AGAACTCCAT 


1440 


GTGTAGGGCT 


1500 


TGATGAGTGA 


1560 


AAACACAGAC 


1620


ATGAAGG CAT 


1680 


AGCCCACGGG 


1740 


CCTCCCTTCC 


1800 


GCCTCCTTAA 


1860 


CTTTACCTCC 


1920 


GCATGCAGGT 


1980 


TGTGGAGGGG 


2040 


TAT CAGAGTC 


2100 


CACTGTCAGG 


2160 


GGTATTTTCT 


2220 


GACTGTGGCT 


2280 


AGGGAACCTG 


2340 


GGGTCAGCCA 


2400 


TGCTGCATGT 


2460 


GCTCCGAATC 


2520 


TTTTATTTAT 


2580 


CAGACCCTGT 


2640 
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WO 02/086443 

CTGTAAAAAA ACCAAAACCC AAAAAAAAAA AAAAAAAAAA 



PCT/US02/12476 



Seq ID NO: 425 Protein sequence
Protein Accession #: AAH10423



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



MPLSLGAEMW 
QVGQVAWARV 
DEGEYECRVS 
VTWDTEVKGT 
HVSFLAEASV 
GFPPLTTEHS 
FCLLVWWL 
EGHPDSLKDN 
AMNHFVQENG 



11 

I 

GPEAWLLLLL 
DAGEGAQELA 
TFPAGSFQAR 
TSSRSFKHSR 
RGLEDQNLWH 
GIYVCHVSNE 
MSRYHRRKAQ 
SSCSVMSEEP 
TLRAKPTGNG 



21 
I 

LLASFTGRCP 
LLHSKYGLHV 
LRLRVLVPPIi 
SAAVTSEFHL 
IGREGAMLKC 
FSSRDSQVTV 
QMTQKYEEEL 
EGRSYSTLTT 
IYINGRGHLV 



31 
I 

AGEIiETSDW 
SPAYEGRVEQ 
PSLNPGPALE 
VPSRSMNGQP 
LSEGQPPPSY 
DVLDPQEDSG 
TLTRENSIRR 
VREIETQTEL 



41 
I 

TWLGQDAKL 
PPPPRNPLDG 
EGQGLTLAAS 
LTCWSHPGL 
NWTRLDGPLP 
KQVDLVSASV 
LHSHHTDPRS 
LSPGSGRAEE 



51 



PCFYRGDSGE 
SVLLRNAVQA 
CTAEGSPAPS 
LQDQRITHIL 
SGVRVDGDTL 
VWGVIAALL 
QPEESVGLRA 
EEDQDEGIKQ 



Seq ID NO: 426 DNA sequence 

Nucleic Acid Accession #: NM_003474.2 

Coding sequence: 37..3036



85 



CACTAACGCT 
TCAAGGCTGG 
CTTTTTTAAA 
CCGGAGCTGA 
GCCCGCGTGG 
GCGACGATGG 
GCCGGTGCTC 
GCTGATGAAG 
TTCGACTCCA 
CTGATCATAA 
TATCTGCAAG 
TGTTACTACC 
TCTGGTCTCA 
AGTGCAACCA 
TGTGGATCAC 
CAGACATGGG 
GTGAT CGTGG 
CAGCGATTAA 
ATCGTGTTGG 
CCATTCACCA 
TCCCATGACA 
GCCCCAATCA 
GACAATCCCC 
AATCATGACA 
AT CATGAACG 
GACTTGGAGA 
AGGGAGTCTT 
GACTGTGGGG 
AAGCCGGACG 
GGAACAGCGT 
AGCCCTCACT 
GGCTACTGCT 
CCAGGTGCTA 
TATGGCAACT 
AAATGTGGAA 
GTTTCCATAG 
CACGTGTACT 
GCAGATGGAA 
GAGTGTGCAA 
GAGGCCCACT 
GGCCCCATCC 
TGTCTTCTTG 
TTTACAAATA 
CGTGGCTTCC 
CCGCCAGATT 
GACATCAGCA 
CTTCCTCCCC 
AAGCCTGCAC 
CCTGCAGATC 
CAATGGGAGA 
GTGCCCAGAT 
TGAAGACAGA 
GGATTTTTTT 
GCTGTGCTGT 
GCAGAATGTT 
CCATGGCAGG 
ATGGGATTCT 
CCAACTACCC 
CTCAGTTGAT 
TGTGTTTGGC 
ACACCTGGGA 
AGGAATCTTA 
TGACCCTGAG 
GGTGCTTGAT 



11 
I 

CTTCCTAGTC 
CTTGTGCCAG 
AATGAAAGGC 
CTCGCCGAGG 
GATGGTG CAG 
CAGCGCGCCC 
TGCTCGCGCC 
TTGTCAGTGC 
AGAATCATCC 
ATCTGGAAAG 
ACGGTACTGA 
ATGGACATGT 
GGGGACTTAT 
ACAGATACAA 
ATCACAACAC 
CAAGAAGGCA 
CAGACAACCG 
TAGAGATTGC 
TAGGCGTGGA 
GCCTCCATGA 
ATGCGCAGCT 
TGAGCATGTG 
TTGGTGCAGC 
CAC TGGACAG 
CTTCCACCGG 
CCAGCCTGGA 
TCGGGGGCCA 
AGCCAGAGGA 
CTGTGTGCGC 
GCAGGGACTC 
GCCCAGCCAA 
ACAATGGCAT 
AACCTGCCCC 
GTGGCAAAGT 
AAATCCAGTG 
AAACAAACAT 
TGGGCGATGA 
AAATCTGCCT 
TGCAGTGCCA 
GGGCACCTCC 
GGCAAGCAGA 
CTGCCGGATT 
AGAAGACCAC 
AACCCTGTCA 
CCTACCCACC 
GACCCCTCAA 
TCCACCGGGC 
TTAGGCAGGC 
CTCTGGCCAG 
CTGGGCTCCG 
CCACCCACAC 
AGTTTGCACT 
TAATGTT TAA 
GCTATGGTGC 
GATTACAGTG 
AAGGCTTGTT 
GGACAGGATG 
CCAGCTGTGC 
TTTCTGGATT 
TTTCAGGGAG 
GAAATCTGGC 
AGGTGTAGCC 
CTGACCAGCC 
AGAAATGCCA 



21 



31 



CCCGGGCCAA 
AACGGCGCGC 
TAGAAGAGCT 
CAGGAAATCC 
CGCTCGCCGC 
GCTGCCCGTG 
CTGCGAGGCC 
CTCTGTTCGG 
AGAAGTGCTG 
AAATGAAGGT 
TGTCTCCCTC 
ACGGGGATAT 
TGTGTTTGAA 
ACTCTTCCCA 
ACCAAACCTC 
TAAAAGAGAG 
AGAGT TTCAG 
TAATCACGTT 
AGTGTGGAAT 
ATTTCTGGAC 
TGTCAGTGGG 
CACGGCAGAC 
CGTGACCCTG 
GGGCTGTAGC 
GTACCCATTT 
GAAAGGAATG 
GAAGTGTGGG 
ATGTATGAAT 
ACATGGGCTG 
CAGCAACTCC 
CGTGTACCTG 
CTGCCAGACT 
TGGGATCTGC 
CTCGAAGAGT 
TCAAGGAGGT 
CCCCCTGCAG 
CATGCCGGAC 
GAATCGTCAA 
CGGCAGAGGG 
CTTCTGTGAC 
TAACCAAGGT 
TGTGGTTTAT 
CATTGAAAAA 
GGCTCACCTC 
GAAGGACAAT 
CGGCCTGAAT 
CCCACGTGCA 
CCAGGGGACC 
AACAACTCGG 
CCTGGCACCC 
CGCCTATATT 
ATCTTTCAGC 
AACATCATTA 
TCTGTCTACT 
CAGTGCGCTG 
GTGCTTTTAG 
TGTTTGCTTT 
TTATGGTACC 
CCCCATCTCA 
GCCCTGTGCC 
TTCTGGCCAG 
ACACCAGGAT 
GTGAGCATGT 
AGCACTTCTT 



CTCGGACAGT 
GCGCGACGCA 
CAGCGGCGGC 
CTCCGGTCGC 
CGGGCCCGAG 
TCCCCCGCCC 
CGAGGGGTGA 
AGTGGGGACC 
AATATTCGAC 
CTCATTGCCA 
GCTCGAAATT 
TCTGATTCAG 
AATGAAAGCT 
GCGAAGAAGC 
GCTGCAAAGA 
ACCCTCAAGG 
AGGCAAGGAA 
GACAAGTTTT 
GACATGGACA 
TGGAGGAAGA 
GTTTATTTCC 
CAGTCTGGGG 
GCACATGAGC 
TGT CAAATGG 
CCCATGGTGT 
GGGGTGTGCC 
AACAGATTTG 
CGCTGCTGCA 
TGCTGTGAAG 
TGTGACCTCC 
CACGATGGGC 
CACGAGCAGC 
TTTGAGAGAG 
TCCTTTGCCA 
GCCAGCCGGC 
CAAGGAGGCC 
CCAGGGCTTG 
TGTCAAAATA 
GTGTGCAACA 
AAGTTTGGCT 
TTAACCATAG 
CTCAAAAGGA 
CTAAGGTGTG 
GGCCACCTTG 
CCCAGGAGAT 
GTCCCTCAGC 
CCTAGCGTCC 
TGTAAGCCAA 
CTCACTCATG 
CTCAGACCTG 
AAGTGAGAAG 
TCCAGTTGGA 
CTATAAGAAC 
TGCACAGGTA 
TAGTAGGCAT 
TATTTTAGTG 
CTGAT CAAGG 
AGATGCAGCT 
GGCCAGAGCC 
CCTTGACAAC 
GAAGCTTTGG 
AGAGACTGGA 
TTGGAAGGGG 
TTTCTCGCTG 



41 
I 

TTGCTCATTT 

CGCACACACA 

GCGGGCCGTG 

GACGCCCGGC 

AGCTGCTGCA 

GCGCCCTCCT 

GCTTATGGAA 

TCTGGATCCC 

TACAACGGGA 

GCAGTTTCAC 

ACACGGTAAT 

CAGTCAGTCT 

ATGTCTTAGA 

TGAAAAGCGT 

ATGTGTTTCC 

CAACTAAGTA 

AAGAT CTGGA 

ACAGACCACT 

AATGCTCTGT 

TGAAGCTTCT 

AAGGGACCAC 

GAATTGTCAT 

TGGGCCACAA 

CGGTTGAGAA 

TCAGCAGTTG 

TGTTTAACCT 

TGGAAGAAGG 

ATGCCACCAC 

ACTGCCAGCT 

CAGAGTTCTG 

ACTCATGTCA 

AGTGTGT CAC 

TCAATTCTGC 

AATGCGAGAT 

CAGTCATTGG 

GGATTCTGTG 

TGCTTGCAGG 

TTAGTGTCTT 

ACAGGAAGAA 

TTGGAGGAAG 

GAATTCTGGT 

AGACCTTGAT 

TGCGCCCTTC 

GAAAAGGCCT 

TGCTGCAGTG 

CCCAGTCAAC 

CTGCCAGACC 

ACCCCCCTCA 

CCTTGGCCAG 

CTCCACAATA 

CCGACACCTT 

GTTTTTTGTA 

TTTGAGCTAC 

CTTGTAAATT 

TTTTACCATC 

AACTTGAAAT 

CCTTATTGGA 

CAAGAGATCC 

AAGGGGCTTC 

TGGCAGGCAG 

TGAGAACCTG 

ACACTAGACA 

TCTGTAGTGT 

TCCTTTCTAG 



51 



ATTGCAACGG 
CGGGGGGAAA 
CGCGAGGGCT 
CCCGCTCGGC 
CTGAAGGCCG 
GCTCGCCCTG 
CGAAGGAAGA 
AGTGAAGAGC 
AAGCAAAGAA 
GGAAACCCAC 
TCTGGGTCAC 
CAGCACGTGT 
ACCAATGAAA 
CCGGGGATCA 
ACCACCCTCT 
TGTGGAGCTG 
AAAAGTTAAG 
GAACATTCGG 
AAGT CAGG AC 
ACCTCGCAAA 
CATCGGCATG 
GGACCATTCA 
TTTCGGGATG 
AGGAGGCTGC 
CAGCAGGAAG 
GCCGGAAGTC 
AGAGGAGTGT 
CTGTACCCTG 
GAAGCCTGCA 
CACAGGGGCC 
GGATGTGGAC 
ACTCTGGGGA 
AGGTGATCCT 
GAGAGATGCT 
TACCAATGCC 
CCGGGGGACC 
CACAAAGTGT 
TGGGGTTCAC 
CTGCCACTGC 
CACAGACAGC 
GACCATCCTG 
ACGACTGCTG 
CCGGCCACCC 
GATGAGGAAG 
TCAGAATGTT 
TCAGCGAGTG 
CCTGCCAGCC 
GAAGCCTCTG 
GACCCCAGGA 
TCCACACCAA 
TTTTCAACAG 
CCAACTTTTA 
TGCCGTCAGT 
ATTAATTTAT 
ACTGAGTTTT 
ATCCTGCTTG 
AAGCAGTCCC 
CAAGTAGAAT 
AGGTCCAGGC 
GCTCCCAGGG 
GGTTGCAGAC 
AGCCAGAACT 
CACTCAAGGC 
AGCACTGCCA 



60 
120 
180 
240 
300 
360 
420 
480 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 



345 
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CCAGTAGGTT ATTTAGCTTG GGAAAGGTGG TGTTTCTGTA AGAAACCTAC TGCCCAGGCA 3900 

CTGCAAACCG CCACCTCCCT ATACTGCTTG GAGCTGAGCA AATCACCACA AACTGTAATA 3960

CAATGATCCT GTATTCAGAC AGATGAGGAC TTTCCATGGG ACCACAACTA TTTTCAGATG 4020

TGAACCATTA ACCAGATCTA GTCAATCAAG TCTGTTTACT GCAAGGTTCA ACTTATTAAC 4080 

AATTAGGCAG ACTCTTTATG CTTGCAAAAA CTACAACCAA TGGAATGTGA TGTTCATGGG 4140 

TATAGTT CAT GTCTGCTATC ATTATTCGTA GATATTGGAC AAAGAACCTT CTCTATGGGG 4200 

CATCCTCTTT TTCCAACTTG GCTGCAGGAA TCTTTAAAAG ATGCTTTTAA CAGAGTCTGA 4260 

ACCTATTTCT TAAACACTTG CAACCTACCT GTTGAGCATC ACAGAATGTG ATAAGGAAAT 4320 

CAACTTGCTT ATCAACTTCC TAAATATTAT GAGATGTGGC TTGGGCAGCA TCCCCTTGAA 4380 

CTCTTCACTC TTCAAATGCC TGACTAGGGA GCCATGTTTC ACAAGGTCTT TAAAGTGACT 4440 

AATGGCATGA GAAATACAAA AATACT CAGA TAAGGTAAAA TGCCATGATG CCTCTGTCTT 4500 

CTGGACTGGT TTTCACATTA GAAGACAATT GACAACAGTT ACATAATTCA CTCTGAGTGT 4560 

TTTATGAGAA AGCCTTCTTT TGGGGT CAAC AGTTTTCCTA TGCTTTGAAA CAGAAAAATA 462 0 

TGTAC CAAG A ATCTTGGTTT GCCTTCCAGA AAACAAAACT GCATTTCACT TTCCCGGTGT 4680 

TCCCCACTGT ATCTAGGCAA CATAGTATTC ATGACTATGG ATAAACTAAA CACGTGACAC 4740 

AAACACACAC AAAAGGGAAC CCAGCTCTAA TACATTCCAA CTCGTATAGC ATGCATCTGT 4800 

TTATTCTATA GTTATTAAGT TCTTTAAAAT GTAAAGCCAT GCTGGAAAAT AATACTGCTG 4860 

AGATACATAC AGAATTACTG TAACTGATTA CACTTGGTAA TTGTACTAAA GCCAAACATA 4 92 0 

TATATACTAT TAAAAAGGTT TACAGAATTT TATGGTGCAT TACGTGGGCA TTGTCTTTTT 4 980 

AGATG CCCAA ATCCTTAGAT CTGGCATGTT AGCCCTTCCT CCAATTATAA GAGGATATGA 5040 
ACCAAAAAAA AAAAAAAAAA AA 

Seq ID NO: 427 Protein sequence 
Protein Accession #: NP_003465 

1 11 21 31 41 51 

| | | | | |

MAARPLPVSP ARALLLALAG ALLAPCEARG VSLWNEGRAD EWSASVRSG DLWIPVKSFD 60 

SKNHPEVLNI RLQRESKELI INLERNEGLI ASSFTETHYL QDGTDVSLAR NYTVILGHCY 120 

YHGHVRGYSD SAVSLSTCSG LRGLIVFENE SYVLEPMKSA TNRYKLFPAK KLKSVRGSCG 180 

SHHNTPNLAA KNVFPPPSQT WARRHKRETL KATKYVELVI VADNREFQRQ GKDLEKVKQR 240 

LIEIANHVDK FYRPLNIRIV LVGVEVWNDM DKCSVSQDPF TSLHEFLDWR KMKLLPRKSH 3 00 

DNAQLVSGVY FQGTTIGMAP IMSMCTADQS GG I VMDHSDN PLGAAVTLAH ELGHNFGMNH 3 60 

DTLDRGCSCQ MAVEKGGCIM NASTGYPFPM VFSSCSRKDL ETSLEKGMGV CLFNLPEVRE 42 0 

SFGGQKCGNR FVEEGEECDC GEPEECMNRC CNATTCTLKP DAVCAHGLCC EDCQIiKPAGT 480 

ACRDSSNSCD LPEFCTGASP HCPANVYLHD GHSCQDVDGY CYNGICQTHE QQCVTLWGPG 540 

AKPAPGICFE RVNSAGDPYG NCGKVSKSSF AKCEMRDAKC GKIQCQGGAS RPVIGTNAVS 600 

IETNIPLQQG GRILCRGTHV YLGDDMPDPG LVLAGTKCAD GKICLNRQCQ NISVFGVHEC 660 

AMQCHGRGVC NNRKNCHCEA HWAPPFCDKF GFGGSTDSGP IRQADNQGLT IGILVTILCL 720 

LAAGFWYLK RKTLIRLLFT NKKTT I EKLR CVRPSRPPRG FQPCQAHLGH LGKGLMRKPP 780 

DSYPPKDNPR RLLQCQNVDI SRPLNGLNVP QPQSTQRVLP PLHRAPRAPS VPARPLPAKP 840 

ALRQAQGTCK PNPPQKPLPA DPLARTTRLT HALARTPGQW ETGLRLAPLR PAPQYPHQVP 900 
RSTHTAYIK 

Seq ID NO: 428 DNA sequence 

Nucleic Acid Accession #: NM_003714 

Coding sequence: 135.. 1043 

1 11 21 31 41 51 

| | | | | |

GAGGAGGAGG GAAAAGGCGA G C AAAAAGG A AGAGTGGGAG GAGGAGGGGA AGCGGCGAAG 60 

GAGGAAGAGG AGGAGGAGGA AGAGGGGAGC ACAAAGGATC CAGGTCTCCC GACGGGAGGT 120 

TAATACCAAG AACCATGTGT GCCGAGCGGC TGGGCCAGTT CATGACCCTG GCTTTGGTGT 180 

TGGCCACCTT TGACCCGGCG CGGGGGACCG ACGCCACCAA CCCACCCGAG GGTCCCCAAG 240 

ACAGGAGCTC CCAGCAGAAA GGCCGCCTGT CCCTGCAGAA TACAGCGGAG ATCCAGCACT 300 

GTTTGGTCAA CGCTGGCGAT GTGGGGTGTG GCGTGTTTGA ATGTTTCGAG AACAACTCTT 360 

GTGAGATTCG GGGCTTACAT GGGATTTGCA TGACTTTTCT GCACAACGCT GGAAAATTTG 420 

ATGCCCAGGG CAAGTCATTC ATCAAAGACG CCTTGAAATG TAAGGCCCAC GCTCTGCGGC 480 

ACAGGTTCGG CTGCATAAGC CGGAAGTGCC CGGCCATCAG GGAAATGGTG TCCCAGTTGC 540 

AGCGGGAATG CT ACCT CAAG CACGACCTGT GCGCGGCTGC CCAGGAGAAC ACCCGGGTGA 600 

TAGTGGAGAT GATCCATTTC AAGGACTTGC TGCTGCACGA ACCCTACGTG GACCTCGTGA 660 

ACTTGCTGCT GACCTGTGGG GAGGAGGTGA AGGAGGCCAT CACCCACAGC GTGCAGGTTC 720 

AGTGTGAGCA GAACTGGGGA AGCCTGTGCT CCATCTTGAG CTTCTGCACC TCGGCCATCC 780 

AGAAGCCTCC CACGGCGCCC CCCGAGCGCC AGCCCCAGGT GGACAGAACC AAGCTCTCCA 840 

GGGCCCACCA CGGGGAAGCA GGACATCACC TCCCAGAGCC CAGCAGTAGG GAGACTGGCC 900 

GAGGTGCCAA GGGTGAGCGA GGTAGCAAGA GCCACCCAAA CGCCCATGCC CGAGGCAGAG 960 

TCGGGGGCCT TGGGGCTCAG GGACCTTCCG GAAGCAGCGA GTGGGAAGAC GAACAGTCTG 1020 

AGTATTCTGA TATCCGGAGG TGAAATGAAA GGCCTGGCCA CGAAATCTTT CCTCCACGCC 1080 

GTCCATTTTC TTATCTATGG ACATTCCAAA ACATTTACCA TTAGAGAGGG GGGATGTCAC 1140 

ACGCAGGATT CTGTGGGGAC TGTGGACTTC ATCGAGGTGT GTGTTCGCGG AACGGACAGG 1200 

TGAGATGGAG ACCCCTGGGG CCGTGGGGTC TCAGGGGTGC CTGGTGAATT CTGCACTTAC 12 60 

ACGTACTCAA GGGAGCGCGC CCGCGTTATC CTCGTACCTT TGTCTTCTTT CCATCTGTGG 1320 

AGTCAGTGGG TGTCGGCCGC TCTGTTGTGG GGGAGGTGAA CCAGGGAGGG GCAGGGCAAG 1380 

GCAGGGCCCC CAGAGCTGGG CCACACAGTG GGTGCTGGGC CTCGCCCCGA AGCTTCTGGT 1440 

GCAGCAGCCT CTGGTGCTGT CTCCGCGGAA GTCAGGGCGG CTGGATTCCA GGACAGGAGT 1500 

GAATGTAAAA ATAAATATCG CTTAGAATGC AGGAGAAGGG TGGAGAGGAG GCAGGGGCCG 1560 

AGGGGGTGCT TGGTGCCAAA CTGAAATTCA GTTTCTTGTG TGGGGCCTTG CGGTTCAGAG 1620

CTCTTGGCGA GGGTGGAGGG AGGAGTGTCA TTTCTATGTG TAATTTCTGA GCCATTGTAC 1680 

TGTCTGGGCT GGGGGGGACA CTGTCCAAGG GAGTGGCCCC TATGAGTTTA TATTTTAACC 1740 

ACTGCTTCAA ATCTCGATTT CACTTTTTTT ATTTATCCAG TTATATCTAC ATATCTGTCA 1800 

TCTAAATAAA TGGCTTTCAA ACAAAGCAAC TGGGTCATTA AAACCAGCTC AAAGGGGGTT 1860 

TAAAAAAAAA AAAACCAGCC CATCCTTTGA GGCTGATTTT TCTTTTTTTT AAGTTCTATT 1920 

TTAAAAG CT A TCAAACAGCG ACATAGCCAT ACATCTGACT GCCTGACATG GACTCCTGCC 1980 

CACTTGGGGG AAACCTTATA CCCAGAGGAA AATACACACC TGGGGAGTAC ATTTGACAAA 2040 

TTTCCCTTAG GATTTCGTTA TCTCACCTTG ACCCTCAGCC AAGATTGGTA AAGCTGCGTC 2100 

CTGGCGATTC CAGGAGACCC AGCTGGAAAC CTGGCTTCTC CATGTGAGGG GATGGGAAAG 2160 

GAAAGAAGAG AATGAAGACT ACTTAGTAAT TCCCATCAGG AAATGCTGAC CTTTTACATA 2220 



346 



WO 02/086443 

AAATCAAGGA GACTGCTGAA AATCTCTAAG GGACAGGATT TTCCAGATCC TAATTGGAAA 
TTTAGCAATA AGGAGAGGAG TCCAAGGGGA CAAATAAAGG CAGAGAGAGA GAGAGAGAGA 
GGGAGAGGAA GAAAAGAGAG AGAGAAAAGA GCCTCGTGCC 



2280 
2340 



PCT/US02/12476 



Seq ID NO: 429 Protein sequence
Protein Accession #: NP_003705



10 



15 



i 
I 

MCAERLGQFM 
GDVGCGVFEC 
ISRKCPAIRE 
CGEEVKEAIT 
EAGHHLPEPS 
RR 



11 

1 

TLALVLATFD 
FENNSCEIRG 
MVSQLQRECY 
HSVQVQCEQN 
SRETGRGAKG 



21 
I 

PARGTDATNP 
LHG I CMTFLH 
LKHDLCAAAQ 
WGSLCSILSF 
ERGSKSHPNA 



31 
I 

PEGPQDRSSQ 
NAGKFDAQGK 
ENTRVIVEMI 
CTSAIQKPPT 
HARGRVGGLG 



.41 



QKGRLSLQNT 
SFIKDALKCK 
HFKDLLLHEP 
APPERQPQVD 
AQGPSGSSEW 



51 
1 

AE I QHCLVNA 60 

AHALRHR FGC 120 

YVDLVNLLLT 180 

RTPCLSRAHHG 240 

EDEQSEYSDI 300 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 
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Seq ID NO: 43 0 DNA sequence 

Nucleic Acid Accession #: NM_005940 

Coding sequence: 23.. 1489 



1 
I 

AAGCCCAGCA 
CGCCCTCCTG 
TCTGCCGCCG 
AGCCCTGCCC 
CAGCCTCAGG 
CCGACAGAAG 
GATCCTTCGG 
CCTAAAGGTA 
TGACAT CATG 
TGGGGGCATC 
CGACTATGAT 
AGCCCATGAA 
GTCCGCCTTC 
TCAACACCTA 
CCAGGCTGGG 
CTGTGAGGCC 
GGGCTTTGTG 
TCGCCACTGG 
CATTTGGTTC 
CCCCGCACCC 
GGGTCCCGAG 
CAGCACCCGG 
CTCTGAGATC 
CCTCTACTGG 
GGGTCCTGAC 
ATGCCCTCAG 
ATCTTTGTGG 
GGTGGGGTAC 
AGCGACTGTC 
GGGACCCGCT 
GTAGCACCAT 
TCCTTCCAGG 
TGAGCAACTG 
ATCTGTCTGC 
GTTCACAGTC 
CAACATACCT 
ATCCTCCAAA 
TTTTTAAACT 



11 

I 

GCCCCGGGGC 
CCCCCGATGC 
GACGTCCACC 
AGTAGCCCGG 
CCTCCCCGCT 
AGGTTCGTGC 
TTCCCATGGC 
TGGAGCGATG 
ATCGACTTCG 
CTGGCCCATG 
GAGACCTGGA 
TTTGGCCACG 
TACACCTTTC 
TATGGCCAGC 
ATAGACACCA 
TCCTTTGACG 
TGGCGCCTCC 
CAGGGACTGC 
TTCCAAGGTG 
CTCACCGAGC 
AAGAACAAGA 
CGTGTAGACA 
GACGCTGCCT 
AAGTTTGACC 
TTCTTTGGCT 
GGGTGCTGAC 
CTGTGGGCAC 
AACCAC CAT G 
TCAGACTGGG 
ATGCAGGTCC 
GGCAGGACTG 
GGCTGGCACT 
GGCTGTAGGG 
CTTCTGGCTG 
AAATGGGGAG 
CAATCCTGTC 
GCCATTGTAA 
GAGGATTGTC 



21 
I 

GGATGGCTCC 
TGCTGCTGCT 
ACCTCCATGC 
CACCTGCCCC 
GTGGCGTGCC 
TTTCTGGCGG 
AGTTGGTGCA 
TGACGCCACT 
CCAGGTACTG 
CCTTCTTCCC 
CTATCGGGGA 
TGCTGGGGCT 
GCTACCCACT 
CCTGGCCCAC 
ATGAGATTGC 
CGGTCTCCAC 
GTGGGGG CCA 
CCAGCCCTGT 
CTCAGTACTG 
TGGGCCTGGT 
TCTACTTCTT 
GTCCCGTGCC 
TCCAGGATGC 
CTGTGAAGGT 
GTGCCGAGCC 
CCCTGCCAGG 
CAGGCATGGG 
ACAACTGCCG 
CAGGGAGGCT 
TGGCAAACCT 
GGGGAACTGG 
GAAG CAAGGG 
CAGGGCCACT 
ACAAT CCTGG 
GGGTATTCTT 
CCAGGCCGGA 
ATGTGTGTAC 
ATTAAACACA 



31 



41 



51 



GGCCGCCTGG 
GCTCCAGCCG 
CGAGAGGAGG 
TGCCACGCAG 
CGACCCATCT 
GCGCTGGGAG 
GGAGCAGGTG 
CACCTTTACT 
GCATGGGGAC 
CAAGACTCAC 
TGACCAGGGC 
GCAGCACACA 
GAGTCTCAGC 
TGTCACCTCC 
ACCGCTGGAG 
CATCCGAGGC 
GCTGCAGCCC 
GGACGCTGCC 
GGTGTACGAC 
GAGGTTCCCG 
CCGAGGCAGG 
CCGCAGGGCC 
TGATGGCTAT 
GAAGGCT CTG 
TGCCAACACT 
CCACGAATAT 
ACTGAGCCCA 
GGAGGGCCAC 
TTGGCATGAC 
GGCTGCCCTG 
AGTGTCCTTG 
TGCTGGGGCC 
TCCTGAGGTC 
AAATCTGTTC 
CATGCAGGAG 
TCCTCCTGAA 
AGTGTGTATA 
GTTGTTTTCT 



CTCCGCAGCG 
CCGCCGCTGC 
GGGCCACAGC 
GAAGCCCCCC 
GATGGGCTGA 
AAGACGGACC 
CGGCAGACGA 
GAGGTG CACG 
GACCTGCCGT 
CGAGAAGGGG 
ACAGACCTGC 
ACAGCAG CCA 
CCAGATGACT 
AGGACCCCAG 
CCAGACGCCC 
GAGCTCTTTT 
GGCTACCCAG 
TTCGAGGATG 
GGTGAAAAGC 
GTCCATGCTG 
GACTACTGGC 
ACTGACTGGA 
GCCTACTTCC 
GAAGGCTTCC 
TTCCTCTGAC 
CAGGCTAGAG 
TGTCTCCTGC 
GCAGGTCGTG 
TTAAGAGGAA 
TCTCATCCCT 
CTGTATCCCT 
CCATGGCCTT 
AGGTCTTGGT 
TCCAGAATCC 
ACCCCAGGCC 
GCCCTTTTCG 
AACCTTCTTC 



CGGCCGCGCG 6 0 

TGGCCCGGGC 12 0 

CCTGGCATGC 180 

GGCCTGCCAG 240 

GTGCCCGCAA 3 00 

TCACCTACAG 3 60 

TGGCAGAGGC 42 0 

AGGGCCGTGC 4 80 

TTGATGGGCC 540 

ATGTCCACTT 60 0 

TGCAGGTGGC 660 

AGGCCCTGAT 72 0 

GCAGGGGCGT 7 80 

CCCTGGGCCC 840 

CGCCAGATGC 900 

TCTTCAAAGC 960 

CATTGGCCTC 102 0 

CCCAGGGCCA 1080 

CAGTCCTGGG 1140 

CCTTGGTCTG 12 0 0 

GTTTCCACCC 12 60 

GAGGGGTGCC 132 0 

TGCGCGGCCG 13 80 

CCCGTCTCGT 1440 

CATGGCTTGG 1500 

ACCCATGGCC 15 60 

AGGGGGATGG 1620 

GTCACCTGCC 1680 

GGGCAGTCTT 1740 

GTCCCTCAGG 18 00 

GTTGTGAGGT 18 60 

CAGCCCTGGC 192 0 

AGGTGCCTGC 1980 

AGGCCAAAAA 2 040 

CTGGAGGCTG 210 0 

CAGCACTGCT 2160 

TTCTTTTTTT 222 0 



Seq ID NO: 431 Protein sequence 
Protein Accession #: NP_005931



MAPAAWLRSA 
PAPATQEAPR 
LVQEQVRQTM 
FFPKTHREGD 
YPLSLSPDDC 
VSTIRGELFF 
QYWVYDGEKP 
PVPRRATDWR 
AEPANTFL 



11 

I 

AARALLPPML 
PASSLRPPRC 
AEALKVWSDV 
VHFDYDETWT 
RGVQHLYGQP 
FKAGFVWRLR 
VLGPAPLTEL 
GVPSEIDAAF 



21 
I 

LLLLQPPPLL 
GVPDPSDGLS 
TPLTFTEVHE 
IGDDQGTDLL 
WPTVTSRTPA 
GGQLQPGYPA 
GLVRFPVHAA 
QDAD GYAYFL 



31 
I 

ARAL P PDVHH 
ARNRQKRFVL 
GRADIMIDFA 
QVAAHEFGHV 
LGPQAGIDTN 
LASRHWQGIjP 
LWGPEKNKI 
RGRLYWKFDP 



41 

I 

LHAERRGPQP 
SGGRWEKTDL 
RYWHGDDLPF 
LGLQHTTAAK 
EIAPLEPDAP 
SPVDAAFEDA 
YFFRGRDYWR 
VKVKALEGFP 



51 

i 

WHAALPSSPA 60 

TYRILRFPWQ 120 

DGPGGILAHA 180 

ALMSAFYTFR 240 

PD ACE A S FDA 300 

QGHIWFFQGA 360 

FHPSTRRVDS 42 0 

RLVGPDFFGC 480 



Seq ID NO: 432 DNA sequence 

Nucleic Acid Accession #: NM_024022 

Coding sequence: 202.. 1563 



ACCGGGCACC 
GGAAAGGGCT 
CCATCTACAT 
AGAGGTCCTG 
TCATTCCGAT 



11 
I 

GGACGGCTCG 
GTGTTTATGG 
TTTTGGGACT 
AAATAGTCAC 
CGCTTTTTGG 



21 
I 

GGTACTTTCG 
GAAGCCAGTA 
CGGGAATTAT 
CATGGGGGAA 
CCTTGATGAT 



31 
I 

TTCTTAATTA 
ACACTGTGGC 
GAGGTAGAGG 
AATGATCCGC 
TTGAAAATAA 



41 
I 

GGTCATGCCC 
CTACTATCTC 
TGGAGGCGGA 
CTGCTGTTGA 
GTCCTGTTGC 



51 



GTGTGAGCCA 60 

TTCCGTGGTG 120 

GCCGGATGTC 180 

AGCCCCCTTC 240 

ACCAGATGCA 3 00 



347 



10 



15 



20 



25 



30 



35 



WO 02/086443 

GATGCTGTTG CTGCACAGAT 
ATTGGGATCA TTGCATTGAT 
TCAGGGAAGT ACAGATGTCG 
GGAGTCTCGG ATTGCAAAGA 
AATGCCGTGC TCCAGGTGTT 
AAGGGTCACT ACGCAAATGT 
GATAACCTCA GAGTGAGCTC 
CACCTCTTGC CAGATGACAA 
TGTGCCTCTG GCCACGTGGT ( 
AGCTCACGCA TCGTGGGTGG 
CTTCAGTTCC AGGGCTACCA 
ACTGCTGCAC ACTGTGTTTA 
CTAGTTTCCC TGTTGGACAA 
AG CAAGTACA AGCCAAAGAG 
CTCACGTTCA ATGAAATGAT 
GATGGAAAAG TGTGCTGGAC 
CCTGTCCTGA ACCACGCGGC 
GTGTACGGTG GCATCATCTC 
GACAGCTGCC AGGGGGACAG 
TTAGTGGGAG CGACCAGCTT 
ACCCGTGTCA CCTCCTTCCT 
TGAAGAGGAA GGGGACAAGT 
TCCCCTGGAC TCCCGTGTAG 
CGGCACCAGT AGCAGGCCCG 
GCTGCTTTTT GTTTTTTGTT 
GCAGTGGCGA AATCCCTGCT 
CCTCAGCTTC CCCAGTAGCT 
TATTTTTAGT AGAGACAGGG 
CAAATGATGT GCCTGCTTCA 
CCTAGCCTCA CGCTCCTTTC 
GCGGCCTTTC CCACTGGTCC 
AGATAAGCAG TTATGTGACC 
CCAGCCCAGA AGTGCAGAAC 
AACCCACCCT TTCTACTTCC 
ACTCGTTTAA GGCCTATTTT 
TCCTTTGATT CCAAATAATA 
AAAAA 



CCTGTCACTG 
ATTAGCACTG 
CTCATCCTTT 
CGGGGAGGAC 
CACAGCTGCT 
TGCCTGTGCC 
GCTGGAGGGG 
GGTGACTGCA 
TACCTTGCAG 
AAACATGTCC 
CCTGTGCGGG 
TGACTTGTAC 
TCCAGCCCCA 
GCTGGGCAAT 
CCAGCCTGTG 
GTCAGGATGG 
CGTCCCTTTG 
CCCCTCCATG 
CGGGGGGCCC 
TGGCATCGGC 
GGACTGGATC 
AGCCACCTGA 
GAACCTGCAC 
AAAGAGGCAC 
TTTTTGAGGT 
CACTGCAGCC 
GGGACCACAG 
TTTCACCATG 
GCCTCCCACA 
TGATCTTCAC 
ATCTGGTTTT 
TCACGTGCAA 
TGCAGTCACT 
AAGACTTATT 
CATGATTTCT 
TGTTTCCTTC 



CTGCCATTGA 
GCCATTGGTC 
AAGTGTATCG 
GAGTACCGCT 
TCGTGGAAGA 
CAACTGGGTT 
CAGTTCCGGG 
TTACACCACT 
TGCACAGCCT 
TTGCTCTCGC 
GGCTCTGTCA 
CTCCCCAAGT 
TCCCACTTGG 
GACATCGCCC 
TGCCTGCCCA 
GGGGCCACAG 
ATTTCCAACA 
CTCTGCGCGG 
CTGGTGTGTC 
TGCGCAGAGG 
CACGAGCAGA 
GTTCCTGAGG 
ACGAGCAGAC 
CCTTCCATCT 
GGAGTCTCGG 
TCCGCTTCCC 
GTGCCCGCCA 
TTGGCCAGGC 
GTGCTGGGAT 
TAAGAACAAA 
CTCTCCAGGG 
AGCCACCAAC 
GCACGTTTTC 
TTCACATGTG 
TTGTAGCATT 
CCTCAAAAAA 



AGTTTTTTCC 
TGGGCATCCA 
AGCTGATAGC 
GTGT CCGGGT 
CCATGTGCTC 
TCCCAAGCTA 
AGGAGTTTGT 
CAGTATATGT 
GTGGTCATAG 
AGTGGCCCTG 
TCACGCCCCT 
CATGGACCAT 
TGGAGAAGAT 
TTATGAAGCT 
ACTCTGAAGA 
AGGATGGAGG 
AGATCTGCAA 
GCTACCTGAC 
AAGAGAGGAG 
TGAACAAGCC 
TGGAGAGAGA 
TGATGAAGAC 
ACCCTTGGAG 
GATTCCAGCA 
TCTGTTGCCC 
TGGTTCAAGC 
CCACACCCAA 
TGCTCTCAAA 
TACAGG CATG 
AGAAGCAGCA 
GTCTTGCAAA 
AGCCACTCAG 
ATCTCTAGGG 
GGGAGGTTAA 
TGGTGCTTGA 
AAAAAAAAAA 



AATCAT CGTC 3 60 

CTTCGACTGC 42 0 

TCGATGTGAC 4 80 

GGGTGGTCAG 540 

CGATGACTGG 60 0 

TGTGAGTTCA 660 

GTCCATCGAT 720 

GAGGGAGGGA 780 

AAGGGGCTAC 840 

GCAGGCCAGC 900 

GTGG AT CAT C 960 

CCAGGTGGGT 102 0 

TGTCTACCAC 10 8 0 

GGCCGGGCCA 1140 

GAACTTCCCC 12 00 

TGACGCCTCC 12 60 

CCACAGGGAC 132 0 

GGGTGGCGTG 13 80 

GCTGTGGAAG 1440 

TGGGGTGTAC 150 0 

CCTAAAAACC 1560 

AGCCCGATCC 162 0 

CTCTGAGTTC 1680 

CAACCTT CAA 1740 

AGGCTGGAGT 1800 

GATTCTCTTG 18 60 

CTAATTTTTG 192 0 

CCCCTGACCT 1980 

GGCCACCACG 2 040 

ACTTGCAAGG 2100 

ATTCCTGACG 2160 

AAAAGACGCA 2220 

ACCAGAACCA 2280 

TCTAGGAATG 2340 

CGTATTATTG 240 0 

AAAAAAAAAA 2460 



PCT/US02/12476 



40 



45 



50 



Seq ID NO: 433 Protein sequence 
Protein Accession #: NP_076927 



11 



MGENDPPAVE 
LALAIGLGIH 
TAASWKTMCS 
VTALHHSVYV 
LCGGSVITPL 
LGNDIALMKL 
VPLISNKICN 
G I GCAEVNKP 



APFSFRSLFG 
FDCSGKYRCR 
DDWKGHYANV 
REGCASGHW 
WIITAAHCVY 
AGPLTFNEMI 
HRDVYGGIIS 
GVYTRVTSFL 



21 
t 

LDDLKISPVA 
SSFKCIELIA 
ACAQLGFPSY 
TLQCTACGHR 
DLYLPKSWTI 
QPVCLPNSEE 
PSMLCAGYLT 
DWIHEQMERD 



31 
1 

PDADAVAAQI 
RCDGVSDCKD 
VSSDNLRVSS 
RGYSSRIVGG 
QVGLVSLLDN 
NFPDGKVCWT 
GGVDSCQGDS 
LKT 



41 
i 

LSLLPLKFFP 
GEDEYRCVRV 
LEGQFREEFV 
NMSLLSQWPW 
PAPSHLVEKI 
SGWGATEDGG 
GGPLVCQERR 



51 
I 

IIVIGIIALI 60 

GGONAVLQVF 120 

SIDHLLPDDK 180 

QASLQFQGYH 2 40 

VYHSKYKPKR 3 0 0 

DASPVLNHAA 3 60 

LWKLVGATSF 420 



55 



Seq ID NO: 434 DNA sequence 

Nucleic Acid Accession #: NM_000493.2 

Coding sequence: 97..2139 



60 



65 



70 



75 



80 



85 



1 
I 

CACCTTCTGC 
CCAGGAACTC 
CTGCTAGTAT 
ACAGGCATAA 
AAGAGTAAAG 
GGACCTCGAG 
GGACTCCAAG 
GGTGTGCCAG 
GTTGGACCAG 
CCGGCTGGAA 
CCCAGGGGCT 
GGGGAAATGG 
GGTCCCACAG 
GGACAGCCAG 
CCAGGTCCCC 
GCTGGAGCCC 
ATAGCTGGGC 
GAAAGAGGAC 
GGTCTTCCTG 
AAAGGCATCC 
CCTGCAGGAT 
GGGTACCCAG 
AAAGGTGATC 
GCAAAGGGAA 
GGTACTAGAG 
CCAGGAAGTC 
ACCGGGCCAC 
CCCCCTGGGC 
GGCCAAAGGC 



11 
I 

ACTGCTCATC 
CCAGCACGCA 
CCTTGAACTT 
AAGGCCCACT 
GTATAGCAGT 
GGCACCCAGG 
GAGAGCCAGG 
GACTCCCAGG 
CTGGCCTACC 
TTTCTGTGCC 
TTCCTGGAGA 
GATATGGTGC 
GACCATCTGG 
GCATCAAAGG 
AAGGCCCTCC 
CAGGCCAGCC 
CCCCAGGGCC 
CTGCTGGCCT 
GGAAGCCAGG 
CGGGTAGCCA 
ACCCTGGGGC 
GAAAACCAGG 
CTGGAGTTGG 
TGCCCGGACA 
GCCCTATTGG 
CCGGTCCTCC 
CAGGGCCTCC 
CTCCAGGCCC 
CCAGTCTTTC 



21 



TGGGCAGAGG 
GAATCCATCT 
GGTTCATGGA 
ACCCAACACC 
AAGAGGAGAG 
TCCTTCTGGA 
GTTGCCAGGA 
AAAACCAGGA 
AGGACCCCGG 
AGGAAAACCT 
AAAGGGTGCA 
TCCTGGTCGT 
CCCTCCTGGA 
TGATAGAGGT 
TGGGGAACGA 
AGGGATTCCA 
TCCTGGCTTT 
TCCTGGGGGT 
TCTGACTGGA 
TGGTCTCCCA 
TAAGGGTGAA 
TCTCGATGGT 
AGGACCTCCT 
CAATGGAGAG 
GCCACCAGGC 
TGGCCCAGCT 
AGGTCCAAGA 
ACCAGGTCAA 
TGGGACCCCT 



31 
I 

AAG CTTCAGA 
GAGAATATGC 
GTGTTTTACG 
AAGACACAGT 
CAAGGT ACT C 
CCACCAGGAA 
CCACCGGGAC 
GAGAGAGGAC 
GGCCCACCAG 
GGACAACAGG 
CCAGGAGTCC 
CCAGGTGAGA 
GTGGGAAAAA 
TTTCCGGGAG 
GGGCCAGAAG 
GGAACAAAAG 
GGGAAACCAG 
CCAGGTGCCA 
CCCCCTGGGA 
GGCCCTAAAG 
AGGGGTTCCC 
CCTAAGGGTA 
GGTCTCCCAG 
GCTGGCCCAA 
ATTCCAGGAT 
GGCATAGCAA 
GGCCACTCTG 
GCAGTCATGC 
CTTGTTAGTG 



41 
I 

AAGCTGCCAA 
TGCCACAAAT 
CTGAACGATA 
TCTTCATTCC 
CTGGTCCACC 
AACCAGGCTA 
CATCAGCTGT 
CATATGGACC 
GACCACCTGG 
GACCCACAGG 
CTGGTATGAA 
GGGGTCTTCC 
GAGGTGAAAA 
AAATGGG AC C 
G CAT T GG AAA 
GTCTCCCTGG 
GCTTGCCAGG 
AAGGGGAACA 
ATATGGGACC 
GTGAGACAGG 
CTGGGTCAGA 
ACCCAGGGTT 
GCCCTGTGGG 
GAGGTGCCCC 
TCCCTGGGTC 
CTAAGGGCCT 
GAGAGCCTGG 
CTGAGGGTTT 
CCAACCAGGG 



51 



GGCACCATCT 60 

ACCCTTTTTG 120 

CCAAATGCCC 180 

CTACACCATA 240 

AGGCCCTGCT 3 0 0 

CGGAAGTCCT 3 60 

AGGGAAACCA 420 

AAAAGGAGAT 480 

AATCCCTGGA 540 

AGCCCCAGGA 60 0 

TGGACAGAAA 660 

AGGCCCTCAG 720 

TGGGGTTCCA 780 

AATTGGCCCA 840 

GCCAGGAGCT 90 0 

GGCTCCAGGA 960 

CCTGAAGGGA 1020 

AGGGCCAGCA 1080 

CCAAGGACCA 1140 

GCCAGCTGGG 12 00 

TGGAAAACCA 12 60 

ACCAGGTCCA 1320 

CCCAGCAGGA 1380 

TGGAATACCA 1440 

TAAAGGGGAT 1500 

CAATGGACCC 1560 

TCTTCCAGGG 1620 

TATAAAGGCA 1680 

GGTAACAGGA 1740 



348 



WO 02/086443 

ATGCCTGTGT CTGCTTTTAC TGTTATTCTC TCCAAAGCTT ACCCAGCAAT AGGAACTCCC 1800 

ATACCATTTG ATAAAATTTT GTATAACAGG CAACAGCATT ATGACCCAAG GACTGGAATC 1860 

TTTACTTGTC AGATACCAGG AATATACTAT TTTTCATACC ACGTGCATGT GAAAGGGACT 1920 

CATGTTTGGG TAGGCCTGTA TAAGAATGGC ACCCCTGTAA TGTACACCTA TGATGAATAC 1980 

ACCAAAGGCT ACCTGGATCA GGCTTCAGGG AGTGCCATCA TCGATCTCAC AGAAAATGAC 2040 

CAGGTGTGGC TCCAGCTTCC CAATGCCGAG TCAAATGGCC TATACTCCTC TGAGTATGTC 210 0 

CACTCCTCTT TCTCAGGATT CCTAGTGGCT CCAATGTGAG TACACCCCAC AGAGCTAATC 2160 

TAAATCTTGT GCTAGAAAAA GCATTCTCTA ACTCTACCCC ACCCTACAAA ATGCATATGG 2220 

AGGTAGGCTG AAAAGAATGT AATTTTTATT TTCTGAAATA CAGATTTGAG CTATCAGACC 2280 

AACAAACCTT CCCCCTGAAA AGTGAGCAGC AACGTAAAAA CGTATGTGAA GCCTCTCTTG 2340 

AATTTCTAGT TAGCAATCTT AAGGCTCTTT AAGGTTTTCT CCAATATTAA AAAATATCAC 2400 

CAAAGAAGTC CTGCTATGTT AAAAACAAAC AACAAAAAAC AAAGCAACAA AAAAAAAAAT 2460 

TAAAAAAAAA AACAGAAATA GAGCTCTAAG TTATGTGAAA TTTGATTTGA GAAACTCGGC 2520 

ATTTCCTTTT TAAAAAAGCC TGTTTCTAAC TATGAATATG AGAACTTCTA GGAAACATCC 2580 

AGGAGGTATC ATATAACTTT GTAGAACTTA AATACTTGAA TATTCAAATT TAAAAGACAC 2 640 

TGTATCCCCT AAAATATTTC TGATGGTGCA CTACTCTGAG GCCTGTATGG CCCCTTTCAT 2 7 00 

CAATATCTAT TCAAATATAC AGGTGCATAT ATACTTGTTA AAG CTCTT AT ATAAAAAAGC 2 7 60 

CCCAAAATAT TGAAGTTCAT CTGAAATGCA AGGTGCTTTC ATCAATGAAC CTTTT CAAAA 2 82 0 

CTTTTCTATG ATTGCAGAGA AGCTTTTTAT ATACCCAGCA TAACTTGGAA ACAGGTATCT 2 8 80 

GACCTATTCT TATTTAGTTA ACACAAGTGT GATTAATTTG ATTTCTTTAA TTCCTTATTG 2 940 

AATCTTATGT GATATGATTT TCTGGATTTA CAGAACATTA GCACATGTAC CTTGTGCCTC 3 000 

CCATTCAAGT GAAGTTATAA TTTACACTGA GGGTTTCAAA ATTCGACTAG AAGTGGAGAT 3 0 60 

ATATTATTTA TTTATGGACT GTACTGTATT TTTATATTGC TGTTTAAAAC TTTTAAGCTG 3120 

TGCCTCACTT ATTAAAGCAC AAAATGTTTT ACCTACTCCT TATTTACGAC ACAATAAAAT 3180 

AACATCAATA GATTTTTAGG CTGAATTAAT TTGAAAGCAG CAATTTGCTG TTCTCAACCA 3240 
TTCTTTCAAG GCTTTTCATT CGACACAATA AAATAAC AT C AATAG 

Seq ID NO: 435 Protein sequence 
Protein Accession #: NP_000484.2 

1 11 21 31 41 51 

1111-11 

MLPQIPFLLL. VSLNLVHGVF YAERYQMPTG IKGPLPNTKT QFFIPYTIKS KGIAVRGEQG 60 
TPGPPGPAGP RGHPGPSGPP GKPGYGSPGL QGEPGLPGPP GPSAVGKPGV PGLPGKPGER 12 0 
GPYGPKGDVG PAGLPGPRGP PGPPGIPGPA GISVPGKPGQ QGPTGAPGPR GFPGEKGAPG 180 
VPGMNGQKGE MGYGAPGRPG ERGLPGPQGP TGPSGPPGVG KRGENGVPGQ PGIKGDRGFP 240 
GEMGPIGPPG PQGPPGERGP EGIGKPGAAG APGQPGIPGT KGLPGAPGIA GPPGPPGFGK 300 
PGLPGLKGER GPAGLPGGPG AKGEQGPAGL PGKPGLTGPP GNMGPQGPKG IPGSHGLPGP 360 
KGETGPAGPA GYPGAKGERG SPGSDGKPGY PGKPGLDGPK GNPGLPGPKG DPGVGGPPGL 420 
PGPVGPAGAK GMPGHNGEAG PRGAPGIPGT RGPIGPPGIP GFPGSKGDPG SPGPPGPAGI 480 
ATKGLNGPTG PPGPPGPRGH SGEPGLPGPP GPPGPPGQAV MPEGFIKAGQ RPSLSGTPLV 540 
SANQGVTGMP VSAFTVILSK AYPAIGTPIP FDKILYNRQQ HYDPRTGIFT CQIPGIYYFS 600 
YHVHVKGTHV WVGLYKNGTP VMYTYDEYTK GYLDQASGSA IIDLTENDQV WLQLPNAESN 660 
GLYSSEYVHS SFSGFLVAPM 



Seq ID NO: 436 DNA sequence 

Nucleic Acid Accession #: XM_062811 

Coding sequence: 1..888 

1 11 21 31 41 51 

I I I I I I 

ATGTGGGGCG CTCGCCGCTC GTCCGTCTCC TCATCCTGGA ACGCCGCTTC GCTCCTGCAG 60 

CTGCTGCTGG CTGCGCTGCT GGCGGCGGGG GCGAGGGCCA GCGGCGAGTA CTGCCACGGC 120 

TGGCTGGACG CGCAGGGCGT CTGGCGCATC GGCTTCCAGT GTCCCGAGCG CTTCGACGGC 180 

GGCGACGCCA CCATCTGCTG CGGCAGCTGC GCGTTGCGCT ACTGCTGCTC CAGCGCCGAG 240 

GCGCGCCTGG ACCAGGGCGG CTGCGACAAT GACCGCCAGC AGGGCGCTGG CGAGCCTGGC 3 00 

CGGGCGGACA AAGACGGCCC CGACGGCTCG GCAGTGCCCA TCTACGTGCC GTTCCTCATT 3 60 

GTTGGCTCCG TGTTTGTCGC CTTTATC AT C TTGGGGTCCC TGGTGGCAGC CTGTTGCTGC 42 0 

AGATGTCTCC GGCCTAAGCA GGATCCCCAG CAGAGCCGAG CCCCAGGGGG TAACCGCTTG 480 

ATGGAGACCA TCCCCATGAT CCCCAGTGCC AGCACCTCCC GGGGGTCGTC CTCACGCCAG 540 

TCCAGCACAG CTGCCAGTTC CAGCTCCAGC GCCAACTCAG GGGCCCGGGC GCCCCCAACA 60 0 

AGGTCACAGA CCAACTGTTG CTTGCCGGAA GGGACCATGA ACAACGTGTA TGTCAACATG 660 

CCCACGAATT TCTCTGTGCT GAACTGTCAG CAGGCCACCC AGATTGTGCC ACATCAAGGG 720 

CAGTATCTGC ATCCCCCATA CGTGGGGTAC ACGGTGCAGC ACGACTCTGT GCCCATGACA 780 

GCTGTGCCAC CTTTCATGGA CGGCCTGCAG CCTGGCTACA GGCAGATTCA GTCCCCCTTC 840 
CCTCACACCA ACAGTGAACA GAAGATGTAC CCAGCGGTGA CTGTATAA 



Seq ID NO: 437 Protein sequence 
Protein Accession #: XP_062811 



1 11 21 31 41 51 

| ] I I I I 

MWGARRSSVS SSWNAASLLQ LLLAALLAAG ARASGEYCHG WLDAQGVWRI GFQCPERFDG 60 
GDATICCGSC ALRYCCSSAE ARLDQGGCDN DRQQGAGEPG RADKDGPDGS AVPIYVPFLI 120 
VGSVFVAFII LGSLVAACCC RCLRPKQDPQ QSRAPGGNRL METIPMIPSA STSRGSSSRQ 180 
SSTAASSSSS ANSGARAPPT RSQTNCCLPE GTMNNVYVNM PTNFSVLNCQ QATQIVPHQG 240 
QYLHPPYVGY TVQHDSVPMT AVPPFMDGLQ PGYRQIQSPF PHTNSEQKMY PAVTV 



Seq ID NO: 438 DNA sequence 

Nucleic Acid Accession #: NM_004004.1 

Coding sequence: 1..681 

1 11 21 31 41 51 

j I I I I 1 

ATGGATTGGG GCACGCTGCA GACGAT CCTG GGGGGTGTGA ACAAACACTC CACCAGCATT 60 
GGAAAGATCT GGCTCACCGT CCTCTTCATT TTTCGCATTA TGATCCTCGT TGTGGCTGCA 120 
AAGGAGGTGT GGGGAGATGA GCAGGCCGAC TTTGTCTGCA ACACCCTGCA GCCAGGCTGC 180 



349 



WO 02/086443 

AAGAACGTGT GCTACGATCA CTACTTCCCC ATCTCCCACA TCCGGCTATG GGCCCTGCAG 
CTGATCTTCG TGTCCAGCCC AGCGCTCCTA GTGGCCATGC ACGTGGCCTA CCGGAGACAT 
GAGAAGAAGA GGAAGTTCAT CAAGGGGGAG ATAAAGAGTG AATTTAAGGA CATCGAGGAG 
ATCAAAACCC AGAAGGTCCG CATCGAAGGC TCCCTGTGGT GGACCTACAC AAGCAGCATC 
TTCTTCCGGG TCATCTTCGA AGCCGCCTTC ATGTACGTCT TCTATGTCAT GTACGACGGC 
TTCTCCATGC AGCGGCTGGT GAAGTGCAAC GCCTGGCCTT GTCCCAACAC TGTGGACTGC 
TTTGTGTCCC GGCCCACGGA GAAGACTGTC TTCACAGTGT TCATGATTGC AGTGTCTGGA 
ATTTGCATCC TGCTGAATGT CACTGAATTG TGTTATTTGC TAATTAGATA TTGTTCTGGG 
AAGTCAAAAA AGCCAGTTTA A 

Seq ID NO: 439 Protein sequence 
Protein Accession #: NP_003995.1 

1 11 21 31 41 51 

I I I I I I 

MDWGTLQTIL GGVNKHSTSI GKIWLTVLFI FRIMILWAA KEVWGDEQAD FVCNTLQPGC 

KNVCYDHYFP ISHIRLWALQ LIFVSSPALL VAMHVAYRRH EKKRKFIKGE IKSEFKDIEE 

IKTQKVRIEG SLWWTYTSSI FFRVIFEAAF MYVFYVMYDG FSMQRLVKCN AWPCPNTVDC 

FVSRPTEKTV FTVFMIAVSG ICILLNVTEL CYLLIRYCSG KSKKPV 



Seq ID NO: 440 DNA sequence 

Nucleic Acid Accession #: XM_061091.1 

Coding sequence: 1..2481 

1 11 21 31 41 51 

I I I I i I 

ATGCCAAATA CTTCAGGAAC AACCAGGATT GAAATTTGGC TTCTCCAAGA GCCGCCCGGG 

CACCGAGCGC TGGTCGCCGC TCTCCTTCCG GTGAGT CCCA GCCCCGAGTT GGCTCTGGCG 

CCCGGGTACC CGCCAGTGCC GGCTGCCGAT GACCGATTCA CGCTCCCGAT GATTGGAGGT 

CAGATGCATG GTGAGAAGGT AGATCTCTGG AGCCTTGGTG TTCTTTGCTA TGAATTTTTA 

GTTGGGAAGC CTCCTTTTGA GGCAAACGAA GTCCATGTAA GCAAAGAAAC CAT CGGG AAG 

ATTTCAGCTG CCAGCAAAAT GATGTGGTGC TCGGCTGCAG TGGACATCAT GTTTCTGTTA 

GATGGGTCTA ACAGCGT CGG G AAAGGG AG C TTTGAAAGGT CCAAGCACTT TGCCATCACA 

GTCTGTGACG GTCTGGACAT CAGCCCCGAG AGGGTCAGAG TGGGAGCATT CCAGTTCAGT 

TCCACTCCTC ATCTGGAATT CCCCTTGGAT TCATTTTCAA CCCAACAGGA AGTGAAGGCA 

AGAATCAAGA GGATGGTTTT CAAAGGAGGG CGCACGGAGA CGGAACTTGC TCTGAAATAC 

CTTCTGCACA GAGGGTTGCC TGGAGGCAGA AATGCTTCTG TGCCCCAGAT CCTCATCATC 

GTCACTGATG GGAAGTCCCA GGGGGATGTG GCACTGCCAT CCAAGCAGCT GAAGGAAAGG 

GGTGTCACTG TGTTTGCTGT GGGGGT CAGG TTTCCCAGGT GGGAGGAGCT GCATGCACTG 

GCCAGCGAGC CTAGAGGGCA GCACGTGCTG TTGGCTGAGC AGGTGGAGGA TGCCACCAAC 

GGCCTCTTCA GCACCCTCAG CAGCTCGGCC ATCTGCTCCA GCGCCACGCC AGCTGGGAGC 

CCCGAGCTTG TCTTCATGGA GCGGTTAATG GGCATCTCTC TGATAGGCCC CTGTGACTCG 

CAGCCCTGCC AGAATGGAGG CACATGTGTT CCAGAAGGAC TGGACGGCTA CCAGTGCCTC 

TGCCCGCTGG CCTTTGGAGG GGAGGCTAAC TGTGCCCTGA AGCTGAGCCT GGAATGCAGG 

GTCGACCTCC TCTTCCTGCT GGACAGCTCT GCGGG CACCA CTCTGGACGG CTTCCTGCGG 

GCCAAAGTCT TCGTGAAGCG GTTTGTGCGG GCCGTGCTGA GCGAGGACTC TCGGGCCCGA 

GTGGGTGTGG CCACATACAG CAGGGAGCTG CTGGTGGCGG TGCCTGTGGG GGAGTACCAG 

GATGTGCCTG ACCTGGTCTG GAGCCT CGAT GGCATTCCCT TCCGTGGTGG CCCCACCCTG 

ACGGGCAGTG CCTTGCGGCA GGCGGCAGAG CGTGGCTTCG GGAGCGCCAC CAGGACAGGC 

CAGGACCGGC CACGTAGAGT GGTGGTTTTG CTCACTGAGT CACACTCCGA GGATGAGGTT 

GCGGGCCCAG CGCGTCACGC AAGGGCGCGA GAGCTGCTCC TGCTGGGTGT AGGCAGTGAG 

GCCGTGCGGG CAGAGCTGGA GGAGATCACA GGCAGCCCAA AGCATGTGAT GGTCTACTCG 

GATCCTCAGG ATCTGTTCAA CCAAATCCCT GAGCTGCAGG GGAAGCTGTG CAGCCGGCAG 

CGGCCAGGGT GCCGGACACA AGCCCTGGAC CTCGTCTTCA TGTTGGACAC CTCTGCCTCA 

GTAGGGCCCG AGAATTTTGC T CAGATGCAG AGCTTTGTGA GAAGCTGTGC CCTCCAGTTT 

GAGGTGAACC CTGACGTGAC ACAGGTCGGC CTGGTGGTGT ATGGCAGCCA GGTGCAGACT 

GCCTTCGGGC TGGACACCAA ACCCACCCGG GCTGCGATGC TGCGGGCCAT TAGCCAGGCC 

CCCTACCTAG GTGGGGTGGG CTCAGCCGGC ACCGCCCTGC TGCACATCTA TGACAAAGTG 

ATGACCGTCC AGAGGGGTGC CCGGCCTGGT GTCCCCAAAG CTGTGGTGGT GCTCACAGGC 

GGGAGAGGCG CAGAGGATGC AGCCGTTCCT GCCCAGAAGC TGAGGAACAA TGGCAT CTCT 

GTCTTGGTCG TGGGCGTGGG GCCTGTCCTA AGTGAGGGTC TGCGGAGGCT TGCAGGTCCC 

CGGGATTCCC TGATCCACGT GGCAGCTTAC GCCGACCTGC GGTACCACCA GGACGTGCTC 

ATTGAGTGGC TGTGTGGAGA AGCCAAGCAG CCAGTCAACC TCTGCAAACC CAGCCCGTGC 

ATGAATGAGG GCAGCTGCGT CCTGCAGAAT GGGAGCTACC GCTGCAAGTG TCGGGATGGC 

TGGGAGGGCC CCCACTGCGA GAACCGTGAG TGGAGCTCTT GCTCTGTATG TGTGAGCCAG 

GGATGGATTC TTGAGACGCC CCTGAGGCAC ATGGCTCCCG TGCAGGAGGG CAGCAGCCGT 

ACCCCTCCCA GCAACTACAG AGAAGGCCTG GGCACTGAAA TGGTGCCTAC CTTCTGGAAT 

GTCTGTGCCC CAGGTCCTTA G 

Seq ID NO: 441 Protein sequence 
Protein Accession #: XP_061091.1 

1 11 21 31 41 51 

1 I I I 1 i 

MPNTSGTTRI EIWLLQEPPG HRALVAALLP VSPSPELALA PGYPPVPAAD DRFTLPMIGG 

QMHGEKVDLW SLGVLCYEFL VGKPPFEANE VHVSKETIGK I SAASKMMWC SAAVDIMFLL 

DGSNSVGKGS FERSKHFAIT VCDGLDISPE RVRVGAFQFS STPHLEFPLD SFSTQQEVKA 

RIKRMVFKGG RTETELALKY LLHRGLPGGR NASVPQILII VTDGKSQGDV ALPSKQLKER 

GVTVFAVGVR FPRWEELHAL ASEPRGQHVL LAEQVEDATN GLFSTLSSSA ICSSATPAGS 

PELVFMERLM GISLIGPCDS QPCQNGGTCV PEGLDGYQCL CPLAFGGEAN CALKLSLECR 

VDLLFLLDSS AGTTLDGFLR AKVFVKRFVR AVLSEDSRAR VGVAT YSREL LVAVPVGEYQ 

DVPDLVWSLD GIPFRGGPTL TGSALRQAAE RGFGSATRTG QDRPRRVWL LTESHSEDEV 

AGPARHARAR ELLLLGVGSE AVRAELEEIT GSPKHVMVYS DPQDLFNQIP ELQGKLCSRQ 

RPGCRTQALD LVFMLDTSAS VGPENFAQMQ SFVRSCALQF EVNPDVTQVG LWYGSQVQT 

AFGLDTKPTR AAMLRAISQA PYLGGVGSAG TALLHIYDKV MTVQRGARPG VPKAVWLTG 

GRGAEDAAVP AQKLRNNGIS VLWGVGPVL SEGLRRLAGP RDSLIHVAAY ADLRYHQDVL 
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IEWLCGEAKQ PVNLCKPSPC MNEGSCVLQN GSYRCKCRDG WEGPHCENRE WSSCSVCVSQ 
GWILETPLRH MAPVQEGSSR TPPSNYREGL GTEMVPTFWN VCAPGP 

Seq ID NO: 442 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..2424 

1 11 21 31 41 51 

I l i l I i 

ATGCCCCCTT TCCTGTTGCT GGAGGCCGTC TGTGTTTTCC TGTTTTCCAG AGTGCCCCCA 
TCTCTCCCTC TCCAGGAAGT CCATGTAAGC AAAGAAACCA TCGGGAAGAT TTCAGCTGCC 
AGCAAAATGA TGTGGTGCTC GGCTGCAGTG GACATCATGT TTCTGTTAGA TGGGTCTAAC 
AGCGTCGGGA AAGGGAGCTT TGAAAGGTCC AAGCACTTTG CCAT CACAGT CTGTGACGGT 
CTGGACATCA GCCCCGAGAG GGTCAGAGTG GGAGCATTCC AGTTCAGTTC CACTCCTCAT 
CTGGAATTCC CCTTGGATTC ATTTTCAACC CAACAGGAAG TGAAGGCAAG AATCAAGAGG 
ATGGTTTTCA AAGGAGGGCG CACGGAGACG GAACTTGCTC TGAAATACCT TCTGCACAGA 
GGGTTGCCTG GAGGCAGAAA TGCTTCTGTG CCCCAGATCC TCATCATCGT CACTGATGGG 
AAGTCCCAGG GGGATGTGGC ACTGCCATCC AAG CAGCTGA AGGAAAGGGG TGTCACTGTG 
TTTGCTGTGG GGGTCAGGTT TCCCAGGTGG GAGGAGCTGC ATGCACTGGC CAGCGAGCCT 
AGAGGGCAGC ACGTGCTGTT GGCTGAGCAG GTGGAGGATG CCACCAACGG CCTCTTCAGC 
ACCCTCAGCA GCTCGGCCAT CTGCTCCAGC GCCACGCCAG ACTGCAGGGT CGAGGCT CAC 
CCCTGTGAGC ACAGGACGCT GGAGATGGTC CGGGAGTTCG CTGGCAATGC CCCATGCTGG 
AGAGGATCGC GGCGGACCCT TGCGGTGCTG GCTGCACACT GTCCCTTCTA CAGCTGGAAG 
AGAGTGTTCC TAACCCACCC TGCCACCTGC TACAGGACCA CCTGCCCAGG CCCCTGTGAC 
TCGCAGCCCT GCCAGAATGG AGGCACATGT GTT CCAGAAG GACTGGACGG CTACCAGTGC 
CTCTGCCCGC TGGCCTTTGG AGGGGAGGCT AACTGTGCCC TGAAGCTGAG CCTGGAATGC 
AGGGTCGACC TCCTCTTCCT GCTGGACAGC TCTGCGGGCA CCACTCTGGA CGGCTTCCTG 
CGGGCCAAAG TCTTCGTGAA GCGGTTTGTG CGGGCCGTGC TGAGCGAGGA CTCTCGGGCC 
CGAGTGGGTG TGGCCACATA CAGCAGGGAG CTGCTGGTGG CGGTGCCTGT GGGGGAGTAC 
CAGGATGTGC CTGACCTGGT CTGGAGCCTC GATGGCATTC CCTTCCGTGG TGGCCCCACC 
CTGACGGGCA GTGCCTTGCG GCAGGCGGCA GAGCGTGGCT TCGGGAGCGC CACCAGGACA 
GGCCAGGACC GGCCACGTAG AGTGGTGGTT TTGCTCACTG AGTCACACTC CGAGGATGAG 
GTTGCGGGCC CAGCGCGTCA CGCAAGGGCG CGAGAGCTGC TCCTGCTGGG TGTAGGCAGT 
GAGGCCGTGC GGGCAGAGCT GGAGGAGATC ACAGGCAGCC CAAAGCATGT GATGGT CT AC 
TCGGATCCTC AGGATCTGTT CAACCAAATC CCTGAGCTGC AGGGGAAGCT GTGCAGCCGG 
CAGCGGCCAG GGTGCCGGAC ACAAGCCCTG GACCTCGTCT T CATGTTGG A CACCTCTGCC 
TCAGTAGGGC CCGAGAATTT TGCTCAGATG CAGAGCTTTG TGAGAAGCTG TGCCCTCCAG 
TTTGAGGTGA ACCCTGACGT GACACAGGTC GGCCTGGTGG TGTATGGCAG CCAGGTGCAG 
ACTGCCTTCG GGCTGGACAC CAAACCCACC CGGGCTGCGA TGCTGCGGGC CATTAGCCAG 
GCCCCCTACC TAGGTGGGGT GGGCTCAGCC GGCACCGCCC TGCTGCACAT CTATGACAAA 
GTGATGACCG TCCAGAGGGG TGCCCGGCCT GGTGTCCCCA AAGCTGTGGT GGTGCTCACA 
GGCGGGAGAG GCGCAGAGGA TGCAGCCGTT CCTGCCCAGA AGCTGAGGAA CAATGGC AT C 
TCTGTCTTGG TCGTGGGCGT GGGGCCTGTC CTAAGTGAGG GTCTGCGGAG GCTTGCAGGT 
CCCCGGGATT CCCTGATCCA CGTGGCAGCT TACGCCGACC TGCGGTACCA CCAGGACGTG 
CTCATTGAGT GGCTGTGTGG AGAAGCCAAG CAGCCAGTCA ACCTCTGCAA ACCCAGCCCG 
TGCATGAATG AGGGCAGCTG CGTCCTGCAG AATGGGAGCT ACCGCTGCAA GTGTCGGGAT 
GGCTGGGAGG GCCCCCACTG CGAGAACCGT GAGTGGAGCT CTTGCTCTGT ATGTGTG AG C 
CAGGGATGGA TTCTTGAGAC GCCCCTGAGG CACATGGCTC CCGTGCAGGA GGGCAGCAGC 
CGTACCCCTC CCAGCAACTA CAGAGAAGGC CTGGGCACTG AAATGGTGCC TACCTTCTGG 
AATGTCTGTG CCCCAGGTCC TTAG 

Seq ID NO: 443 Protein sequence 
Protein Accession #: Eos sequence 

1 11 21 31 41 51 

111)11 
MPPFLLLEAV CVFLFSRVPP SLPLQEVHVS KETIGKISAA SKMMWCSAAV DIMFLLDGSN 

SVGKGSFERS KHFAITVCDG LDISPERVRV GAFQFSSTPH LEFPLDSFST QQEVKARIKR 

MVFKGGRTET ELALKYLLHR GLPGGRNASV PQILIIVTDG KSQGDVALPS KQLKERGVTV 

FAVGVRFPRW EELHALASEP RGQHVLLAEQ VEDATNGLFS TLSSSAICSS ATPD CRVEAH 

PCEHRTLEMV REFAGNAPCW RGSRRTLAVL AAHCPFYSWK RVFLTHPATC YRTTCPGPCD 

SQPCQNGGTC VPEGLDGYQC LCPLAFGGEA NCALKLSLEC RVDLLFLLDS SAGTTLDGFL 

RAKVFVKRFV RAVLSEDSRA RVGVATYSRE LLVAVPVGEY QDVPDLVWSL DGIPFRGGPT 

LTGSALRQAA ERGFGSATRT GQDRPRRVW LLTESHSEDE VAGPARHARA RELLLLGVGS 

EAVRAELEEI TGSPKHVMVY SDPQDLFNQI PELQGKLCSR QRPGCRTQAL DLVFMLDTSA 

SVGPENFAQM QSFVRSCALQ FEVNPDVTQV GLWYGSQVQ TAFGLDTKPT RAAMLRAISQ 

APYLGGVGSA GTALLHIYDK VMTVQRGARP GVPKAVWLT GGRGAEDAAV PAQKLRNNGI 

SVLWGVGPV LSEGLRRLAG PRDSLIHVAA YADLRYHQDV LIEWLCGEAK QPVNLCKPSP 

CMNEGSCVLQ NGSYRCKCRD GWEGPHCENR EWSSCSVCVS QGWILETPLR HMAPVQEGSS 

RTPPSNYREG LGTEMVPTFW NVCAPGP 

Seq ID NO: 444 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 89..2356 

1 11 21 31 41 51 

i ! 1 I 1 I 

GCCCCCTGGC CCGAGCCGCG CCCGGGT CTG TGAGTAGAGC CGCCCGGGCA CCGAGCGCTG 

GTCGCCGCTC TCCTTCCGTT ATATCAACAT GCCCCCTTTC CTGTTGCTGG AAGCCGTCTG 

TGTTTTCCTG TTTTCCAGAG TGCCCCCATC TCTCCCTCTC CAGGAAGTCC ATGTAAGCAA 

AG AAACCAT C GGGAAGATTT CAGCTGCCAG CAAAATGATG TGGTGCTCGG CTGCAGTGGA 

CATCATGTTT CTGTTAGATG GGT CTAACAG CGTCGGGAAA GGGAGCTTTG AAAGGTCCAA 

GCACTTTGCC ATCACAGTCT GTGACGGTCT GGACATCAGC CCCGAGAGGG TCAGAGTGGG 

AGCATTCCAG TTCAGTXCCA CTCCTCATCT GGAATTCCCC TTGGATT CAT TTTCAACCCA 

ACAGGAAGTG AAGGCAAGAA T CAAGAGG AT GGTTTTCAAA GGAGGGCGCA CGGAGACGGA 

ACTTGCTCTG AAATACCTTC TGCACAGAGG GTTGCCTGGA GGCAGAAATG CTTCTGTGCC 

CCAGATCCTC ATCAT CGTCA CTGATGGGAA GTCCCAGGGG GATGTGGCAC TGCCATCCAA 
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GCAGCTGAAG GAAAGGGGTG 
GGAGCTGCAT GCACTGGCCA 
GGAGGATGCC ACCAACGGCC 
CACGCCAGAC TGCAGGGTCG 
GGAGTTCGCT GGCAATGCCC 
TGCACACTGT CCCTTCTACA 
CAGGACCACC TGCCCAGGCC 
TCCAGAAGGA CTGGACGGCT 
CTGTGCCCTG AAGCTGAGCC 
TGCGGGCACC ACTCTGGACG 
GGCCGTGCTG AGCGAGGACT 
GCTGGTGGCG GTGCCTGTGG 
TGGCATTCCC TTCCGTGGTG 
GCGTGGCTTC GGGAG CGCCA 
GCTCACTGAG TCACACTCCG 
AGAGCTGCTC CTGCTGGGTG 
AGGCAGCCCA AAGCATGTGA 
TGAGCTGCAG GGGAAGCTGT 
CCTCGTCTTC ATGTTGGACA 
GAGCTTTGTG AGAAGCTGTG 
CCTGGTGGTG TATGGCAGCC 
GGCTGCGATG CTGCGGGCCA 
CACCGCCCTG CTGCACATCT 
TGTCCCCAAA GCTGTGGTGG 
TGCCCAGAAG CTGAGGAACA 
AAGTGAGGGT CTGCGGAGGC 
CGCCGACCTG CGGTACCACC 
GCCAGTCAAC CTCTGCAAAC 
TGGGAG CT AC CGCTGCAAGT 
CTTGAGACGC CCCTGAGGCA 
AG CAACTAC A GAGAAGGCCT 
CCAGGTCCTT AGAATGTCTG 
GAGGATGTCC CAACTGCAGC 
AAACGATGTT GTTGAAAAGT 
GCCTTGTTGA GGCTATGTCA 
GACTTAAATT TAGCGGCCTG 
TGACACAGTA ATGCCCAGCA 
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TCACTGTGTT 
GCGAGCCTAG 
TCTTCAGCAC 
AGGCTCACCC 
CATGCTGGAG 
GCTGGAAGAG 
CCTGTGACTC 
ACCAGTGCCT 
TGGAATGCAG 
GCTTCCTGCG 
CTCGGGCCCG 
GGGAGTACCA 
GCCCCACCCT 
CCAGGACAGG 
AGGATGAGGT 
TAGGCAGTGA 
TGGTCTACTC 
GCAGCCGGCA 
CCTCTGCCTC 
CCCTCCAGTT 
AGGTGCAGAC 
TTAGCCAGGC 
ATGACAAAGT 
TGCTCACAGG 
ATGGCATCTC 
TTGCAGGTCC 
AGGACGTGCT 
CCAGCCCGTG 
GTCGGGATGG 
CATGGCTCCC 
GGGCACTGAA 
CTTCCCGCCG 
CATGCTGCTT 
TTTGATGTGT 
TCTGCCACCT 
ACGTTCCTTT 
GAGGCCTTTA 



TGCTGTGGGG 
AGGGCAGCAC 
CCTCAGCAGC 
CTGTGAGCAC 
AGGATCGCGG 
AGTGTTCCTA 
GCAGCCCTGC 
CTGCCCGCTG 
GGTCGACCTC 
GGCCAAAGTC 
AGTGGGTGTG 
GGATGTGCCT 
GACGGGCAGT 
CCAGGACCGG 
TGCGGGCCCA 
GGCCGTGCGG 
GGATCCTCAG 
GCGGCCAGGG 
AGTAGGGCCC 
TGAGGTGAAC 
TGCCTTCGGG 
CCCCTACCTA 
GATGACCGTC 
CGGGAGAGGC 
TGTCTTGGTC 
CCGGGATTCC 
CATTGAGTGG 
CATGAATGAG 
CTGGGAGGGC 
GTGCAGGAGG 
ATGGTGCCTA 
TGGCCAGGAC 
AGAGACAAGA 
AAGTAAATAC 
TTCCCTTGAG 
GCACACAATC 
CTAGAGCATC 



GTCAGGTTTC 
GTGCTGTTGG 
TCGGCCATCT 
AGGACGCTGG 
CGGACCCTTG 
ACCCACCCTG 
CAGAATGGAG 
GCCTTTGGAG 
CTCTTCCTGC 
TTCGTGAAGC 
GCCACATACA 
GACCTGGTCT 
GCCTTGCGGC 
CCACGTAGAG 
GCGCGTCACG 
GCAGAGCTGG 
GATCTGTTCA 
TGCCGGACAC 
GAGAATTTTG 
CCTGACGTGA 
CTGGACACCA 
GGTGGGGTGG 
CAGAGGGGTG 
GCAGAGGATG 
GTGGGCGTGG 
CTGATCCACG 
CTGTGTGGAG 
GGCAGCTGCG 
CCCCACTGCG 
GCAGCAGCCG 
CCTTCTGGAA 
CACTATTCTC 
AAGCAGCTGA 
CCACTTTCTG 
GATAAACAAG 
AATGCTCGCC 
CTTTGGACGG 



CCAGGTGGGA 
CTGAG CAGGT 
GCTCCAGCGC 
AGATGGTCCG 
CGGTGCTGGC 
CCACCTGCTA 
GCACATGTGT 
GGGAGGCTAA 
TGGACAGCTC 
GGTTTGTGCG 
GCAGGGAGCT 
GGAGCCTCGA 
AGGCGGCAGA 
TGGTGGTTTT 
CAAGGGCGCG 
AGGAGATCAC 
ACCAAATCCC 
AAGCCCTGGA 
CTCAGATGCA 
CACAGGTCGG 
AACCCACCCG 
GCTCAGCCGG 
CCCGGCCTGG 
CAGCCGTTCC 
GGCCTGTCCT 
TGGCAGCTTA 
AAGCCAAGCA 
TCCTGCAGAA 
AGAACCGATT 
TACCCCTCCC 
TGTCTGTGCC 
ACTGAGGGAG 
TGTCACCCAC 
TACCTGCTGT 
GGGTCCTGAA 
AGAATGTTGT 



Seq ID NO: 445 Protein sequence 
Protein Accession #: Eos sequence 



55 



MPPFLLLEAV 
SVGKGSFERS 
MVFKGGRTET 
FAVGVRFPRW 
PCEHRTLEMV 
SQPCQNGGTC 
RAKVFVKRFV 
LTGSALRQAA 
EAVRAELEEI 
SVGPENFAQM 
APYLGGVGSA 
SVLWGVGPV 
CMNEGSCVLQ 



11 
I 

CVFLFSRVPP 
KHFAITVCDG 
ELALKYLLHR 
EELHALASEP 
REFAGNAPCW 
VPEGLDGYQC 
RAVLSEDSRA 
ERGFGSATRT 
TGSPKHVMVY 
QSFVRSCALQ 
GTALLH I YDK 
LSEGLRRLAG 
NGSYRCKCRD 



21 
I 

SLPLQEVHVS 
LDISPERVRV 
GLPGGRNASV 
RGQHVLLAEQ 
RGSRRTLAVL 
LCPLAFGGEA 
RVGVATYSRE 
GQDRPRRVW 
SDPQDLFNQI 
FEVNPDVTQV 
VMTVQRGARP 
PRDSLIHVAA 
GWEGPHCENR 



31 



KETIGKISAA 
GAFQFSSTPH 
PQILIIVTDG 
VEDATNGLFS 
AAHCPFYSWK 
NCALKLSLEC 
LLVAVPVGEY 
LLTESHSEDE 
PELQGKLCSR 
GLWYGSQVQ 
GVPKAVWLT 
YADLRYHQDV 
FLRRP 



41 
I 

SKMMWCSAAV 
LEFPLDSFST 
KSQGDVALPS 
TLSSSAICSS 
RVFLTHPATC 
RVDLLFLLDS 
QDVPDLVWSL 
VAGPARHARA 
QRPGCRTQAL 
TAFGLDTKPT 
GGRGAEDAAV 
LIEWLCGEAK 



51 
I 

DIMFLLDGSN 
QQEVKARIKR 
KQLKERGVTV 
ATPDCRVEAH 
YRTTCPGP CD 
SAGTTLDGFL 
DGIPFRGGPT 
RELLLLGVGS 
DLVFMLDTSA 
RAAMLRAISQ 
P AQKLRNNG I 
QPVNLCKPSP 



660 
720 
780 
S40 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 



60 



Seq ID NO: 446 DNA sequence 

Nucleic Acid Accession #: NM_031942.1 

Coding sequence: 145..1260 



65 



70 



75 



80 



85 



1 
I 

CCCGAGCCCC 
TGCTCCTCCT 
CCGATCTGGG 
GTAAAGAAGA 
TCCTCTGATG 
TCAGTTCGGG 
GCGATGAAGT 
CAGCCCTCAG 
AATTTTTTGG 
ATGTCTGAAT 
GACTCACAAT 
CCTGAACGGA 
GCTCTACCCA 
ACCGTGGATG 
GTGACCCTTC 
GTCTGCAGCA 
TGCCGTCAGA 
CGAGGCCAGT 
CTGCTGGATC 
CGGCAGCGAG 
TTTGGGAATG 
TATCTGGAAA 
TTTTTTCACT 
AATCAAGTTA 



11 

I 

GCCCCTCCGG 
GCTGTGGGAC 
CACCCGCCAC 
ACTTAAAGAA 
ACAGTTGTGA 
AAGGCTGTAG 
TTCCAGCGCG 
AGAATTCTGT 
AGAAAAGGGC 
TAGAAAGCTT 
CAAGGAGACC 
GAGCTCGTCC 
TGGAGGAGGA 
GCTACATGAA 
CGCATATAAT 
ATTCTCGAGA 
AGACTATTGA 
TCTGTGGCCC 
CGAACTGGCA 
ATGGACGGTG 
TGCATGCCTA 
ATTTGCTGCC 
GAAACCTGAG 
ATCTTAGCAG 



21 

I 

GCCCGGGTCG 
CGCTGACCGC 
CAGCATGGAC 
ATTCAGATAT 
CAGCTTTGCT 
GACCCGCAGC 
GAGTACCAGG 
GACTGATTCC 
TTTAAATATA 
CCCTGGCTCG 
GCGAAGGCGT 
TCTTACCAGG 
GGAGGAAGAG 
TGAAGATGAC 
TCGCCCAGTG 
GAAGATATAT 
TACCAAAACA 
CTGCCTTCGA 
TTGCCCGCCT 
TGCGACTGGG 
CTTGAAAAGC 
TGCCTTCTAC 
TTAAAAATCT 
ACATGTGTTT 



31 
I 

GCGCGCCCAG 
GCGGCTGCTC 
GCTCGCCGCG 
GTGAAGTTGA 
TCTGATAATT 
CAGTGCAGGC 
GGAGCAACCA 
AACTCCGATT 
AAGCAAAACA 
TTCCGTGGAA 
ACATTCCCGG 
TCAAGGTCCC 
GATAAGTACA 
CTGCCCAGAA 
GAAGAAATTA 
AACCGTTCAC 
AACTGCAGAA 
AACCGTTATG 
TGTCGAGGAA 
GTCCTTGTGT 
CTGAAACAGG 
TTCTCAAATC 
TGATGAT CAG 
CTGGAGCATC 



41 



CCTGCCAGCC 
CGCTCTCCCC 
TGCCGCAGAA 
TTTCCATGGA 
TTGCAAACAC 
ACTCTGGACC 
ACAAAAAAGC 
CAGAAGATGA 
AAGCAATGCT 
GACATCCCCT 
GTGTTGCTTC 
GGATCCTCGG 
TGTTGGTGAG 
GCCGTCGCTC 
CAGAGGAGGA 
TGGGCTCTAC 
ACCCAGACTG 
GTGAAGAGGT 
TCTGCAACTG 
ATTTAGCCAA 
AATTTGAAAT 
TTTCTTGTAA 
CCTGTTTCAT 
ACAGAAGGTA 



51 

1 

GCGCTGCTGC 60 

GCTCCAAGCG 12 0 

AGATCTCAGA 180 

AACCTCGTCA 240 

GAGGCTGCAG 300 

TCTCAGGGTG 360 

AGAGTCCCGC 42 0 

AAGTGGAATG 480 

TGCAAAACTC 540 

CCCAGGCTCC 600 

CAGGAGAAAC 660 

GTCCCTTGAC 720 

AAAGAGGAAG 780 

CAGATCATCC 840 

GTTGGAGAAC 900 

TTGTCATCAA 960 

CTGGGGCGTT 102 0 

CAGGGATGCT 1080 

CAGTTTCTGC 1140 

ATATCATGGC 1200 

GCAAGCATAA 12 60 

AAGTTTCCAA 1320 

AAGAAACTCC 13 80 

TATTGCTAGT 1440 
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TACACTTTGC CCTCCTGCAG 
TCTATTTCCA ATGCTCCTCT 
TATGAAAGCA TATTTTATTT 
GAAACACAAT AATAGTATTA 
CTTGTTTACA CAAAAACGAG 
TCAAGGCACA AAAGTCTTAA 
CTCTCAATCC CATGTATTGC 
CTCCTAATTT CTTCTGCCCG 
AAGGTTGGTG GGCAATGTAA 
ATGAGTAAGC TGATTTGAAT 
TTATTTCAGT TCACATGTAA 
TTGATATTAA AAACTAGTCT 
CAAGGTT CAA GTTTAGATTT 
GTAACTTTTA GCAGTTTGTT 
CTGTGTCAGT ATTCCCCCTC 
AAGTGTTTGT ATGT CCAATT 
GATGCATAAT TGGACCTTGA 
TATACAAAAG TTTATTTTAA 
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TTTCTTCTCT 
CCAACCGCTT 
ACTTGGTGTT 
ACTAACTAGA 
TATGATTTAG 
AACCATGTGG 
GCTTATGTTA 
AAGGGTAAGT 
TACTTAATTA 
TTTCAGTATA 
GGTATTGCAA 
GTGGTTCTTT 
TAAGCACTTT 
AACCTGACAT 
CTCTTTGCAT 
TACTTGCATA 
ATCGATAAGT 
TAATAAAATG 



GCTCCCAACC 
AGTTTCTGAA 
GAAATAGCCC 
TCTATTGAAT 
CACTCATACT 
AAAAATTAGG 
CAAGTTGTTG 
GGTGCGTCCA 
AAATAATGAT 
AAACTTTAGT 
ATAAATTCTT 
GCAGTTTCTT 
TATAACAATG 
CTCTGCCAGT 
TAATCAAGGT 
TGTAAACCAT 
GTAAATACAG 
TTTGTTCTAA 



CCCATCTCAT 
TTTCTTTTAA 
T CATAAAACC 
TTCAGAGAAG 
AGTTGAAATT 
TAATTATTGC 
TCACAGTTGA 
GCTTACACGA 
GGAAGAGCTA 
ATAATTGTAG 
GGACAATTTT 
GTAAATTTAT 
ATAAGTGCCT 
CTAGTTTCTG 
ATTTGGTAGA 
TGCTGTGCCA 
CTTTTGATCT 
AAAAAAAAAA 



AGCATCCCCC 1500 

ATTACAGTTT 1560 

TAAGCACTTG 1620 

AGCCTTCTAA 1680 

TTTAATAGAA 1740 

AGAT TGATGT 1800 

GACTTAATTT 1860 

TCATAATT CA 1920 

TCTGGAGATT 1980 

TTTGCAAAGT 2 040 

GTATGGAAAC 210 0 

AAACCAGGCA 2160 

TTTTGGAGAT 222 0 

GGCAGGTTTC 2280 

GGTGGAATCT 2340 

TTCAATGTTT 2400 

GTAATGCTTT 2460 



20 



Seq ID NO: 447 Protein sequence 
Protein Accession #: NP_114148.1 



11 



21 



25 



30 



MDARRVPQKD 
RSQCRHSGPL 
NIKQNKAMLA 
TRSRSRILGS 
PVEEITEEBL 
LRNRYGEEVR 
KSLKQEFEMQ 



LRVKKNLKKF 
RVAMKFPARS 
KLMSELESFP 
LDALPMEEEE 
ENVCSNSREK 
D ALLD PNWHC 
A 



RYVKLISMET 
TRGATNKKAE 
GSFRGRHPLP 
EEDKYMLVRK 
IYNRSLGSTC 
PPCRGICNCS 



31 
I 

SSSSDDSCDS 
SRQPSENSVT 
GSDSQSRRPR 
RKTVDGYMNE 
HQCRQKTIDT 
FCRQRDGRCA 



41 

I 

FASDNFANTR 
DSNSDSEDES 
RRTFPGVASR 
DDLPRSRRSR 
KTNCRNPDCW 
TGVLVYLAKY 



51 
I 

LQSVREGCRT 60 

GMNFLEKRAL 12 0 

RNPERRARPL 180 

SSVTLPHIIR 240 

GVRGQFCGPC 300 

HGFGNVHAYL 360 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



Seq ID NO: 448 DNA sequence 

Nucleic Acid Accession #: NM_019894 

Coding sequence: 1..1314 



ATGTTACAGG 
AAACCCCGTA 
CTGAGCCTGG 
TACTTCCTCT 
CTGGACTGTC 
GCAGTGGCAG 
GGGAACTGGT 
AGGCAGATGG 
GATCTGGATG 
GGGCCCTGTC 
AAGACCCCCC 
AGCATCCAGT 
CTCACGGCAG 
GGCTCAGACA 
TTCAACCCCA 
ACTTTCTCAG 
GCCACCCCAC 
GACATACTGC 
GCGTACCAGG 
GACACCTGCC 
GTGGGCATCG 
AAGGTCT CAG 



11 
1 

ATCCTGACAG 
TCCCCATGGA 
CGAGT AT CAT 
GCGGGCAGCC 
CCTTGGGGGA 
TCCGCCTCTC 
TCTCTGCCTG 
GCTACAGCAG 
TTGTTGAAAT 
TCTCAGGCTC 
GTGTGGTGGG 
ACGACAAACA 
CCCACTGCTT 
AACTGGGCAG 
TGTACCCCAA 
GCACAGTCAG 
TCTGG AT CAT 
TGCAGGCGTC 
GGGAAGTCAC 
AGGGTGACAG 
TTAGCTGGGG 
CCTATCTCAA 



21 



31 



TGATCAACCT 
GACCTTCAGA 
CATTGTGGTT 
TCTCCACTTC 
GGACGAGGAG 
CAAGGACCGA 
TTTCGACAAC 
CAAACCCACT 
CACAGAAAAC 
CCTGGTCTCC 
TGGGGAGGAG 
GCACGTCTGT 
CAGGAAACAT 
CTTCCCATCC 
AGACAATGAC 
GCCCATCTGT 
TGGATGGGGC 
AGT CCAGGTC 
CGAGAAGATG 
TGGTGGGCCC 
CTATGGCTGC 
CTGGATCTAC 



CTGAACAGCC 
AAGGTGGGGA 
GTCCTCATCA 
AT CCCGAGGA 
CACTGTGTCA 
TCCACACTGC 
TTCACAGAAG 
TTCAGAGCTG 
AGCCAGGAGC 
CTGCACTGTC 
GCCTCTGTGG 
GGAGGG AG CA 
AC CG AT GTGT 
CTGGCTGTGG 
ATCGCCCTCA 
CTGCCCTTCT 
TTTACGAAGC 
ATTGACAGCA 
ATGTGTGCAG 
CTGATGTACC 
GGGGGCCCGA 
AATGTCTGGA 



41 

1 

T CG ATGT CAA 
TCCCCATCAT 
AGGTGATTCT 
AGCAGCTGTG 
AGAGCTTCCC 
AGGTGCTGGA 
CTCTCGCTGA 
TGGAG AT TGG 
TTCGCATGCG 
TTGCCTGTGG 
ATTCTTGGCC 
TCCTGGACCC 
T CAAC TGG AA 
CCAAGAT CAT 
TGAAGCTGCA 
TTGATGAGGA 
AGAATGGAGG 
CACGGTGCAA 
GCATCCCGGA 
AATCTGACCA 
GCACCCCAGG 
AGGCTGAGCT 



51 



ACCCCTGCGC 
CATAGCACTA 
GGATAAATAC 
TGACGGAGAG 
CGAAGGGCCT 
CTCGGCCACA 
GACAGCCTGT 
CCCAGACCAG 
GAACTCAAGT 
GAAGAGCCTG 
TTGGCAGGTC 
CCACTGGGTC 
GGTGCGGGCA 
CAT CAT T G AA 
GTTCCCACTC 
GCTCACTCCA 
GAAGATGTCT 
TGCAGACGAT 
AGGGGGTGTG 
GTGGCATGTG 
AGTATACACC 
GTAA 



Seq ID NO: 449 Protein sequence 
Protein Accession #: NP_063947.1 



MLQDPDSDQP 
YFLCGQPLHF 
GNWFSACFDN 
GPCLSGSLVS 
LTAAHCFRKH 
TFSGTVRPIC 
AYQGEVTEKM 



11 
I 

LNSLDVKPLR 
I PRKQLCDGE 
FTEALAETAC 
LHCLACGKSL 
TDVFNWKVRA 
LPFFDEELTP 
MCAGIPEGGV 



21 

I 

KPRIPMETFR 
LDCPLGEDEE 
RQMGYSSKPT 
KTPRWGGEE 
GSDKLGSFPS 
ATPLWIIGWG 
DTCQGDSGGP 



31 
i 

KVGIPIIIAti 
HCVKSFPEGP 
FRAVEIGPDQ 
ASVDSWPWQV 
LAVAKIIIIE 
FTKQNGGKMS 
LMYQSDQWHV 



41 



IiSLASIIIW 
AVAVRL SKDR 
DLDWEITEN 
SIQYDKQHVC 
FNPMYPKDND 
DILLQASVQV 
VGIVSWGYGC 



51 
I 

VLIKVILDKY 
STLQVLDSAT 
SQELRMRNSS 
GGSILDPHWV 
IALMKLQFPL 
IDSTRCNADD 
GGPSTPGVYT 



Seq ID NO: 450 DNA sequence 

Nucleic Acid Accession #: XM_051860.2 

Coding sequence: 52..3042 



GCTCACCCAG 
GTTAACCTCA 
GACCGGGGCA 
CCCAAACTCA 
AATGTACAGT 
TACCAGGCAG 



11 
I 

GAAAAATATG 
GCACCGAGGT 
GAGCCTGCCG 
CAGTCACCAT 
CATGGAAACC 
AAGAGTTCCA 



21 

I 

CAATCGTCCC 
TGTCTACAAA 
GAGCTACCGT 
TGACACCAAT 
TGGAGATACC 
GGTGCTTCCC 



31 

I 

ATTGATATAC 
AAAGGCCAGG 
GTACGGTTCC 
GTGAACAGCA 
CTGGTCATTG 
TGCAGATCCT 



41 

I 

AGGCCACTAC 
ATTATAGGTT 
TCTGTGGGAA 
CCATTCTGAA 
CCAGTACTGA 
GCGCCCCCAA 



51 
! 

AATGGATGGA 
TGCTTGCTAC 
GCCTGTGAGG 
CTTGGAGGAT 
TTACTCCATG 
CCAGGTCAAA 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 



60 
120 
180 
240 
300 
360 
420 



60 
120 
180 
240 
300 
360 



353 



WO 02/086443 

GTGGCAGGGA AACCAATGTA CCTGCACATC GGGGAGGAGA TAGACGGCGT GGACATGCGG 420 

GCGGAGGTTG GGCTTCTGAG CCGGAACATC AT AGTG AT GG GGGAGATGGA GGACAAATGC 480 

TACCCCTACA GAAACCACAT CTGCAATTTC TTTGACTTCG ATACCTTTGG GGGCCACATC 540 

AAGTTTGCTC TGGGATTTAA GGCAGCACAC TTGGAGGGCA CGGAGCTGAA GCATATGGGA 600 

CAGCAGCTGG TGGGT CAGT A CCCGATTCAC TTCCACCTGG CCGGTGATGT AGACGAAAGG 660 

GGAGGTTATG ACCCACCCAC ATACATCAGG GACCTCTCCA TCCATCATAC ATTCTCTCGC 720 

TGCGTCACAG TCCATGGCTC CAATGGCTTG TTGATCAAGG ACGTTGTGGG CTATAACTCT 780 

TTGGGCCACT GCTTCTTCAC GGAAGATGGG CCGGAGGAAG GCAACACTTT TGACCACTGT 840 

CTTGGCCTCC TTGTCAAGTC TGGAACCCTC CTCCCCTCGG ACCGTGACAG CAAGATGTGC 900 

AAGATGATCA CAGGAGACTC CTACCCAGGG TACATCCCCA AGCCCAGGCA AGACTGCAAT 960 

GCTGTGTCCA CCTTCTGGAT GGCCAATCCC AACAACAACC TCAT CAACTG TGCCGCTGCA 1020 

GGATCTGAGG AAACTGGATT TTGGTTTATT TTT CACCACG TACCAACGGG CCCCTCCGTG 1080 

GGAATGTACT CCCCAGGTTA TTCAGAGCAC ATTCCACTGG GAAAATTCTA TAACAACCGA 1140 

GCACATTCCA ACTACCGGGC TGGCATGATC ATAGACAA CG GAGTCAAAAC CACCGAGGCC 1200 

TCTGCCAAGG ACAAGCGGCC GTTCCTCTCA ATCATCTCTG CCAGATACAG CCCTCACCAG 1260 

GACGCCGACC CGCTGAAGCC CCGGGAGCCG GCCATCATCA GACACTTCAT TGCCTACAAG 1320 

AACCAGGACC ACGGGGCCTG GCTGCGCGGC GGGGATGTGT GGCTGGACAG CTGCCGGTTT 13 80 

GCTGACAATG GCATTGGCCT GACCCTGGCC AGTGGTGGAA CCTTCCCGTA TGACGACGGC 1440 

TCCAAGCAAG AGATAAAGAA CAGCTTGTTT GTTGGCGAGA GTGGCAACGT GGGGA CGGAA 1500 

ATGATGGACA ATAGGATCTG GGGCCCTGGC GGCTTGGACC ATAGCGGAAG GACCCTCCCT 1560 

ATAGGCCAGA ATTTTCCAAT TAGAGGAATT CAGTTATATG ATGGCCCCAT CAACATCCAA 162 0 

AACTGCACTT TCCGAAAGTT TGTGGCCCTG GAGGGCCGGC ACACCAGCGC CCTGGCCTTC 1680 

CGCCTGAATA ATGCCTGGCA GAGCTGCCCC CATAACAACG TGACCGGCAT TGCCTTTGAG 1740 

GACGTTCCGA TTACTTCCAG AGTGTTCTTC GGAGAGCCTG GGCCCTGGTT CAACCAGCTG 1800 

GACATGGATG GGGATAAGAC ATCTGTGTTC CATGACGTCG ACGGCTCCGT GTCCGAGTAC 1860 

CCTGGCTCCT ACCTCACGAA GAATGACAAC TGGCTGGTCC GGCACCCAGA CTGCAT CAAT 1920 

GTTCCCGACT GGAGAGGGGC CATTTGCAGT GGGTGCTATG CACAGAT GT A CATTCAAGCC 1980 

TACAAGACCA GTAACCTGCG AATGAAGATC ATCAAGAATG ACTTCCCCAG CCACCCTCTT 2040 

TACCTGGAGG GGGCGCTCAC CAGGAGCACC CATTACCAGC AATACCAACC GGTTGTCACC 210 0 

CTGCAGAAGG GCTACACCAT CCACTGGGAC CAGACGGCCC CCGCCGAACT CGCCATCTGG 2160 

CTCATCAACT TCAACAAGGG CGACTGGATC CGAGTGGGGC TCTGCTACCC GCGAGGCACC 2220 

ACATTCTCCA TCCTCTCGGA TGTTCACAAT CGCCTGCTGA AGCAAACGTC CAAGACGGGC 2280 

GTCTTCGTGA GGACCTTGCA GATGGACAAA GTGGAGCAGA GCTACCCTGG CAGGAGCCAC 2340 

TACTACTGGG ACGAGGACTC AGGGCTGTTG TTCCTGAAGC TGAAAGCTCA GAACGAGAGA 2400 

GAGAAGTTTG CTTTCTGCTC CATGAAAGGC TGTGAGAGGA TAAAGATTAA AGCTCTGATT 2460 

CCAAAGAACG CAGGCGT CAG TGACTGCACA GCCACAGCTT ACCCCAAGTT CACCGAGAGG 2520 

GCTGTCGTAG ACGTGCCGAT GCCCAAGAAG CTCTTTGGTT CTCAGCTGAA AACAAAG G AC 2580 

CATTTCTTGG AGGTGAAGAT GGAGAGTTCC AAGCAGCACT TCTTCCACCT CTGGAACGAC 2 640 

TTCGCTTACA TTGAAGTGGA TGGGAAGAAG TACCCCAGTT CGGAGGATGG CATCCAGGTG 270 0 

GTGGTGATTG ACGGGAACCA AGGGCGCGTG GTGAGCCACA CGAGCTT CAG GAACTCCATT 2760 

CTGCAAGGCA TACCATGGCA GCTTTTCAAC TATGTGGCGA CCATCCCTGA CAATTCCATA 2 82 0 

GTGCTTATGG CATCAAAGGG AAGATACGTC TCCAGAGGCC CATGGACCAG AGTGCTGGAA 2 880 

AAGCTTGGGG CAGACAGGGG TCTCAAGTTG AAAGAGCAAA TGGCATTCGT TGGCTTCAAA 2 940 

GGCAGCTTCC GGCCCATCTG GGTGACACTG GACACTGAGG ATCACAAAGC CAAAATCTTC 3 000 

CAAGTTGTGC CCATCCCTGT GGTGAAGAAG AAGAAGTTGT GAGGACAGCT GCCGCCCGGT 3 060 

GCCACCTCGT GGTAGACTAT GACGGTGACT CTTGGCAGCA GACCAGTGGG GGATGGCTGG 3120 

GTCCCCCAGC CCCTGCCAGC AGCTGCCTGG GAAGGCCGTG TTTCAGCCCT GATGGGCCAA 3180 

GGGAAGGCTA TCAGAGACCC TGGTGCTGCC ACCTGCCCCT ACT CAAGTGT CTACCTGGAG 3240 

CCCCTGGGGC GGTGCTGGCC AATGCTGGAA ACATTCACTT TCCTGCAGCC TCTTGGGTGC 3300 

TTCTCTCCTA TCTGTGCCTC TTCAGTGGGG GTTTGGGGAC CATATCAGGA GACCTGGGTT 3 3 60 

GTGCTGACAG CAAAGATCCA CTTTGGCAGG AGCCCTGACC CAGCTAGGAG GTAGTCTGGA 3 420 

GGGCTGGTCA TTCACAGATC CCCATGGTCT TCAGCAGACA AGTG AGGGT G GTAAAT GT AG 3 48 0 

GAGAAAGAGC CTTGGCCTTA AGGAAATCTT TACTCCTGTA AGCAAGAGCC AACCTCACAG 3 540 

GATTAGGAGC TGGGGTAGAA CTGGCTATCC TTGGGGAAGA GGCAAGCCCT GCCTCTGGCC 3 60 0 

GTGTCCACCT TTCAGGAGAC TTTGAGTGGC AGGTTTGGAC TTGGACTAGA TGACTCTCAA 3 660 

AGGCCCTTTT AGTTCTGAGA TTCCAGAAAT CTGCTGCATT TCACATGGTA CCTGGAACCC 3 72 0 

AACAGTTCAT GGAT AT CCAC TGATATCCAT GATGCTGGGT GCCCCAGCGC ACACGGGATG 3780 

GAGAGGTGAG AACTAATGCC TAGCTTGAGG GGTCTGCAGT CCAGTAGGGC AGGCAGTCAG 3840 

GTCCATGTGC ACTGCAATGC CAGGTGGAGA AATCACAGAG AGGTAAAATG GAGGCCAGTG 3 900 

CCATTTCAGA GGGGAGGCTC AGGAAGGCTT CTTGCTTACA GGAATGAAGG CTGGGGGCAT 3 960 

TTTGCTGGGG GGAGATGAGG CAGCCTCTGG AATGGCTCAG GGATTCAGCC CTCCCTGCCG 4020 

CTGCCTGCTG AAGCTGGTGA CTACGGGGTC GCCCTTTGCT CACGTCTCTC TGGCCCACTC 4 0 80 

ATGATGGAGA AGTGTGGTCA GAGGGGAGCA ATGGGCTTTG CTGCTTATGA GCACAGAGGA 414 0 

ATTCAGTCCC CAGGCAGCCC TGCCTCTGAC TCCAAGAGGG TGAAGTCCAC AGAAGTGAGC 42 0 0 

TCCTGCCTTA GGGCCTCATT TGCTCTTCAT CCAGGGAACT GAGCACAGGG GGCCTCCAGG 42 60 

AGACCCTAGA TGTGCTCGTA CTCCCTCGGC CTGGGATTTC AGAGCTGGAA ATATAGAAAA 432 0 

TATCTAGCCC AAAGCCTTCA TTTTAACAGA TGGGGAAAGT GAGCCCCCAA GATGGGAAAG 43 80 

AACCACACAG CTAAGGGAGG GCCTGGGGAG CCCCACCCTA GCCCTTGCTG CCACACCACA 4440 

TTGCCTCAAC AACCGGCCCC AGAGTGCCCA GGCACTCCTG AGGTAGCTTC TGGAAATGGG 450 0 

GACAAGTCCC CTCGAAGGAA AGGAAATGAC TAGAGTAGAA TGACAGCTAG CAGATCTCTT 4560 

CCCTCCTGCT CCCAGCGCAC ACAAACCCGC CCTCCCCTTG GTGTTGGCGG TCCCTGTGGC 462 0 

CTTCACTTTG TTCACTACCT GTCAGCCCAG CCTGGGTGCA CAGTAGCTGC AACTCCCCAT 4680 

TGGTGCTACC TGGCTCTCCT GTCTCTGCAG CTCTACAGGT GAGGCCCAGC AGAGGGAGTA 4740 

GGGCTCGCCA TGTTTCTGGT GAGCCAATTT GGCTGATCTT GGGTGTCTGA ACAGCTATTG 4800 

GGTCCACCCC AGTCCCTTTC AGCTGCTGCT TAATGCCCTG CTCTCTCCCT GGCCCACCTT 48 60 

ATAGAGAGCC CAAAGAGCTC CTGTAAGAGG GAGAACTCTA TCTGTGGTTT ATAATCTTGC 4 920 

ACGAGGCACC AGAGTCTCCC TGGGTCTTGT GATGAACTAC ATTTATCCCC TTTCCTGCCC 4 980 

CAACCACAAA CTCTTTCCTT CAAAGAGGGC CTGCCTGGCT CCCTCCACCC AACTGCACCC 5 040 

ATGAG ACT CG GTCCAAGAGT CCATTCCCCA GGTGGGAGCC AACTGTCAGG GAGGTCTTTC 5100 

CCACCAAACA TCTTTCAGCT GCTGGGAGGT GACCATAGGG CTCTGCTTTT AAAGATATGG 5160 

CTGCTTCAAA GGCCAGAGTC ACAGGAAGGA CTTCTTCCAG GGAGATTAGT GGTGATGGAG 522 0 

AGGAGAGTTA AAATGACCTC ATGTCCTTCT TGT CCACGGT TTTGTTGAGT TTTCACTCTT 52 80 

CTAATGCAAG GGTCTCACAC TGTGAACCAC TTAGGATGTG ATCACTTTCA GGTGGCCAGG 5340 

AATGTTGAAT GTCTTTGGCT CAGTTCATTT AAAAAAGATA TCTATTTGAA AGTTCTCAGA 540 0 

GTTGTACATA TGTTTCACAG TACAGGATCT GTACATAAAA GTTTCTTTCC TAAACCATTC 5460 

ACCAAGAGCC AATATCTAGG CATTTTCTTG G TAG CACAAA TTTTCTTATT GCTTAGAAAA 5520 

TTGTCCTCCT TGTTATTTCT GTTTGTAAGA CTTAAGTGAG TTAGGTCTTT AAGGAAAGCA 5580 



354 



WO 02/086443 

ACGCTCCTCT GAAATGCTTG TCTTTTTTCT GTTGCCGAAA TAGCTGGTCC TTTTTCGGGA 5640 
GTTAGATGTA TAGAGTGTTT GTATGTAAAC ATTT CTTGTA GGCATCACCA TGAACAAAGA 5700 
TATATTTTCT ATTTATTTAT TATATGTGCA CTT CAAGAAG TCACTGTCAG AGAAATAAAG 5760 
AATTGTCTTA AATGTCAAAA AAAAAAAAAA AAAAAAAAAA AAAAAAAA 



PCT/US02/12476 



Seq ID NO; 451 Protein sequence 
Protein Accession #: XP 051860.2 
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MDGVNLSTEV 
LEDNVQSWKP 
DMRAEVGLLS 
HMGQQLVGQY 
YNSLGHCFFT 
DCNAVSTFWM 
NNRAHSNYRA 
AYKNQDHGAW 
GTEMMDNRIW 
LAFRLNNAWQ 
SEYPGSYLTK 
HPLYLEGALT 
RGTTFSILSD 
NEREKFAFCS 
TKDHFLEVKM 
NSILQGIPWQ 
GFKGSFRPIW 



11 
I 

VYKKGQDYRF 
GDTLVIASTD 
RNIIVMGEME 
PIHFHDAGDV 
EDGPEERNTF 
ANPNNNLINC 
GMI IDNGVKT 
LRGGDVWLDS 
GPGGLDHSGR 
SCPHNNVTGI 
NDNWLVRHPD 
RSTHYQQYQP 
VHNRIjLKQTS 
MKGCERIKIK 
ESSKQHFFHL 
IiFNYVATIPD 
VTLDTEDHKA 



21 
I 

ACYDRGRACR 
YSMYQAEEFQ 
DKCYPYRNHI 
DERGGYDPPT 
DHCLGLLVKS 
AAAGSEETGF 
TEASAKDKRP 
CRFADNGIGL 
TLPIGQNFPI 
AFEDVPITSR 
CINVPDWRGA 
WTLQKGYTI 
KTGVFVRTLQ 
ALIPKNAGVS 
WNDFAYIEVD 
NS I VLMASKG 
KIFQWPIPV 



31 



SYRVRFLCGK 
VLPCRSCAPN 
CNFFDFDTFG 
YIRDLSIHKT 
GTLLPSDRDS 
WFIFHHVPTG 
FLSIISARYS 
TLASGGTFPY 
RGIQLYDGPI 
VFFGEPGPWF 
I CSGCYAQMY 
HWDQTAPAEL 
MDKVEQSYPG 
DCTATAYPKF 
GKKYPSSEDG 
RYVSRGPWTR 
VKKKKL 



41 

I 

PVRPKLTVTI 
QVKVAGKPMY 
GH I KFALGFK 
FSRCVTVHGS 
KMCKMITGDS 
PSVGMYSPGY 
PHQDADPLKP 
DDGSKQEIKN 
NIQNCTFRKF 
NQLDMDGDKT 
IQAYKTSNLR 
AIWLINFNKG 
RSHYYWDEDS 
TERAWDVPM 
IQVWIDGNQ 
VLEKLGADRG 



51 
I 

DTNVNSTILN 
LHIGEEIDGV 
AAHLEGTELK 
NGLiLIKDWG 
YPGYIPKPRQ 
SEHIPLGKFY 
REPAIIRHFI 
SLFVGESGNV 
VALEGRHT S A 
SVFHDVDGSV 
MKI IKNDFPS 
DWIRVGLCYP 
GLLFIiKLKAQ 
PKKLFGSQLK 
GRWSHTSFR 
LKLKEQMAFV 



Seq ID NO: 452 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 261.. 2861 



85 



GAGCTAGCGC 
CGGCGCGGGG 
AGCTACCACT 
ACGTCCGGGG 
AGAGGGAGCA 
TGCTGACCAT 
CTGGGTGCCC 
ACCATGTGCA 
CCATCCACAT 
TGCGAACCCG 
GCCCTTTCCA 
CGGATCCTTA 
ATGGACAGAA 
CAGAAGGAGG 
TCGACCCCAA 
AAGAGAGTGA 
TTGCAGTGAA 
AATTGGGAAG 
TGAAAGGAAA 
CTGCTGCTGC 
CTTTGTCCAG 
TAT CTCAGAC 
TATGCAATCG 
AGGTTGTCTA 
GCCGGAGCTA 
CCATTGACAC 
AACCTGGAGA 
TCCAGGTGCT 
TGTACCTGCA 
TGAGCCGGAA 
ACATCTGCAA 
TTAAGGCAGC 
AGTACCCGAT 
CCACATACAT 
GCTCCAATGG 
TCACGGAAGA 
AGTCTGGAAC 
ACTCCTACCC 
GGATGGCCAA 
GATTTTGGTT 
GTTATTCAGA 
GGGCTGGCAT 
GGCCGTTCCT 
AGCCCCGGGA 
CCTGGCTGCG 
AAGGCTTCTT 
CCT CTGGAAT 
CGGGGTCGCC 
GGGAGCAATG 
CTCTGACTCC 
TCTTCATCCA 
CCTCGGCCTG 



11 
1 

TCAAGCAGAG 
AGCCAGCGGG 
CCGCTTGCCC 
CCGCTGCGCT 
CACTGCCAGG 
CAGCTGGCTC 
TGACCAGAGC 
TATCGGCCAG 
CTCAGAGGGA 
GCACATCCTG 
GGGCAATTTC 
CTATGGTCTG 
AAAGCTCTCC 
CTATTTTTTT 
ATCAGGCACA 
ACGTCTGGTC 
TGATGAAGGT 
CAAACACTTC 
TCCATCATCT 
CCGGGTATTC 
TGAGTGGGTT 
TAAAGGTGGG 
TCCCATTGAT 
CAAAAAAGGC 
CCGTGTAGGG 
CAATGTGAAC 
TACCCTGGTC 
TCCCTGCAGA 
CATCGGGGAG 
CATCATAGTG 
TTTCTTTGAC 
ACACTTGGAG 
TCACTTCCAC 
CAGGGACCTC 
CTTGTTGATC 
TGGGCCGGAG 
CCTCCTCCCC 
AGGGTACATC 
TCCCAACAAC 
TATTTTTCAC 
GCACATTCCA 
GATCATAGAC 
CTCAATCATC 
GCCGGCCATC 
CGGCGGGGAT 
GCTTACAGGA 
GGCTCAGGGA 
CTTTGCTCAC 
GGCTTTGCTG 
AAGAGGGTGA 
GGGAACTGAG 
GGATTTCAGA 



21 
1 

CCCAGCGCGG 
GCTGAGCGCG 
ACGCCCCGGG 
CCTGGCCCGC 
ATGGGAGCTG 
ACTCTGACCT 
CCTGAGTTGC 
GGCAAGACAC 
GGCAAGCTGG 
ATTGACAACG 
ACCAT CATTT 
AAGTACATTG 
TGGACATTTC 
GAAAGGAGCT 
GTCATCCATT 
CAGTATTTGA 
TCTCGAAATC 
CTGCACCTTG 
TCAGTGGAAG 
AAATTGTTCC 
CAAGACGTGG 
GAG AAAAT TT 
ATACAGGCCA 
CAGGATTATA 
TTCCTCTGTG 
AGCACCATTC 
ATTGCCAGTA 
TCCTGCGCCC 
GAGATAGACG 
ATGGGGGAGA 
TTCGATACCT 
GGCACGGAGC 
CTGGCCGGTG 
TCCATCCATC 
AAGGACGTTG 
GAACGCAACA 
TCGGACCGTG 
CCCAAGCCCA 
AACCTCATCA 
CACGTACCAA 
CTGGGAAAAT 
AACGGAGTCA 
TCTGCCAGAT 
ATCAGACACT 
GTGTGGCTGG 
ATGAAGGCTG 
TTCAGCCCTC 
GTCTCTCTGG 
CTTATGAGCA 
AGTCCACAGA 
CACAGGGGGC 
GCTGGAAATA 



31 
I 

TGCTATCGGA 
GCCAGGGTCT 
AGCTCGCGGC 
GAGGCGTGAC 
CTGGGAGGCA 
GCTTCCCTGG 
AACCCTGGAA 
TGCTGCTCAC 
TCATTAAAGA 
GAGGAGAGCT 
TGTATGGAAG 
GGGTTGGTAA 
TGAACAAGAC 
GGGGCCACCG 
CTGACCGGTT 
ACGCGGTGCC 
TGGATGACAT 
GATTTAGACA 
ACCATATTGA 
AGACAGAGCA 
AGTGGACGGA 
CAGACCTCTG 
CTACAATGGA 
GGTTTGCTTG 
GGAAGCCTGT 
TGAACTTGGA 
CTGATTACTC 
CCAACCAGGT 
GCGTGGACAT 
TGGAGGACAA 
TTGGGGGCCA 
TGAAGCATAT 
ATGTAGACGA 
ATACATTCTC 
TGGGCTATAA 
CTTTTGACCA 
ACAGCAAGAT 
GGCAAGACTG 
ACTGTGCCGC 
CGGGCCCCTC 
TCTATAACAA 
AAACCACCGA 
ACAGCCCTCA 
TCATTGCCTA 
ACAGCTGCCA 
GGGGCATTTT 
CCTGCCGCTG 
CCCACTCATG 
CAGAGGAATT 
AGTGAGCTCC 
CTCCAGGAGA 
TAGAAAATAT 



41 

1 

CAGAGCCTGG 
GAACCCAGAT 
GCCTGGCGGT 
ACTGTCTCGG 
GGACTTCCTC 
GGCCACATCC 
CCCTGGCCAT 
CTCTTCTGCC 
CCACGA CGAG 
GCATGCTGGG 
GGCTGATGAA 
AGGAGG CGCT 
CCTTCACCCA 
TGGAGTTATT 
TGACACCTAT 
CGATGGCAGG 
GGCCAGGAAG 
CCCTTGGAGT 
ATATCATGGA 
TGGCGAATAT 
GTGGTTCGAT 
GAAAGCTCAC 
TGGAGTTAAC 
CTACGACCGG 
GAGGCCCAAA 
GGATAATGTA 
CATGTACCAG 
C AAAGTGG C A 
GCGGGCGGAG 
ATGCTACCCC 
CATCAAGTTT 
GGGACAGCAG 
AAG GGGAGGT 
TCGCTGCGTC 
CTCTTTGGGC 
CTGTCTTGGC 
GTGCAAGATG 
CAATGCTGTG 
TGCAGGATCT 
CGTGGGAATG 
CCGAGCACAT 
GGCCTCTGCC 
CCAGGACGCC 
CAAGAACCAG 
TTTCAGAGGG 
GCTGGGGGGA 
CCTGCTGAAG 
ATGGAGAAGT 
CAGTCCCCAG 
TGCCTTAGGG 
CCCTAGATGT 
CTAGCCCAAA 



51 

I 

CGAGCGCAAG 
TTCCCAGACT 
CAGCGACCAG 
CTACAGACCC 
TTCAAGGCCA 
ACAGTGGCTG 
GACCAAGACC 
ACGGTCTATT 
CCGATTGTTT 
AGTGCCCTCT 
GGTATTCAGC 
CTTGAGTTGC 
GGTGG CATGG 
GTTCATGTCA 
AGATCCAAGA 
ATCCTTTCTG 
GCGATGACCA 
TTTCTAACTG 
CATCGAGGCT 
TTCAATGTTT 
CATGATAAAG 
CCAGGAAAAA 
CTCAGCACCG 
GGCAGAGCCT 
CTCACAGTCA 
CAGT CATGGA 
GCAGAAGAGT 
GGGAAACCAA 
GTTGGGCTTC 
TACAGAAACC 
GCTCTGGGAT 
CTGGTGGGTC 
TATGACCCAC 
ACAGTCCATG 
CACTGCTTCT 
CTCCTTGTCA 
AT CACAGAGG 
TCCACCTTCT 
GAGGAAACTG 
TACTCCCCAG 
TCCAACTACC 
AAGGACAAGC 
GACCCGCTGA 
GACCACGGGG 
GAGGCTCAGG 
GATGAGGCAG 
CTGGTGACTA 
GTGGTCAGAG 
GCAGCCCTGC 
CCTCATTTGC 
GCTCGTACTC 
GCCTTCATTT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 



355 



10 



15 



20 



25 



WO 02/086443 

T AAC AG AT G G GGAAAGTGAG 
TGGGGAGCCC CACCCTAGCC 
GTGCCCAGGC ACTCCTGAGG 
AAATGACTAG AGTAGAATGA 
AACCCGCCCT CCCCTTGGTG 
AGCCCAGCCT GGGTG C ACAG 
TCTGCAGCTC TACAGGTGAG 
CCAATTTGGC TGATCTTGGG 
TGCTGCTTAA TGCCCTGCTC 
TAAGAGGGAG AACTCTATCT 
GTCTTGTGAT GAACTACATT 
AGAGGGCCTG CCTGGCTCCC 
TTCCCCAGGT GGGAGCCAAC 
GGGAGGTGAC CATAGGGCTC 
GGAAGGACTT CTT CCAGGG A 
TCCTTCTTGT CCACGGTTTT 
GAACCACTTA GGATGTGATC 
TTCATTTAAA AAAGATATCT 
AGGATCTGTA CATAAAAGTT 
TTTCTTGGTA GCACAAATTT 
TGTAAGACTT AAGTGAGTTA 
TTTTTCTGTT GCCGAAATAG 
TGTAAACATT TCTTGTAGGC 
ATGTGCACTT CAAGAAGTCA 
GAGATGTCCT TTGCATTGCT 
TTGGAAAAAT TTTGCTGTTA 
AAAAAAAAAA AAAAAAAAAA 



CCCCCAAGAT 
CTTGCTGCCA 
TAGCTTCTGG 
CAGCTAGCAG 
TTGGCGGTCC 
TAGCTGCAAC 
GCCCAGCAGA 
TGTCTGAACA 
TCTCCCTGGC 
GTGGTTTATA 
TATCCCCTTT 
TCCACCCAAC 
TGTCAGGGAG 
TGCTTTTAAA 
GATTAGTGGT 
GTTGAGTTTT 
ACTTTCAGGT 
ATTTGAAAGT 
TCTTTCCTAA 
TCTTATTGCT 
GGTCTTTAAG 
CTGGTCCTTT 
ATCACCATGA 
CTGTCAGAGA 
TGGAAGGGGT 
TTATAGTAAA 
AA 



GGGAAAGAAC 
CACCACATTG 
AAATGGGGAC 
ATCTCTTCCC 
CTGTGGCCTT 
TCCCCATTGG 
GGGAGTAGGG 
GCTATTGGGT 
CCACCTTATA 
ATCTTGCACG 
CCTGCCCCAA 
TGCACCCATG 
GTCTTTCCCA 
GATATGGCTG 
GATGGAGAGG 
CACTCTTCTA 
GGCCAGGAAT 
TCTCAGAGTT 
ACCATTCACC 
TAGAAAATTG 
GAAAGCAACG 
TTCGGGAGTT 
ACAAAGATAT 
AATAAAGAAT 
GTACCTAGAG 
CATACAAAGG 



CACACAGCTA 
CCTCAACAAC 
AAGTCCCCTC 
TCCTGCTCCC 
CACTTTGTTC 
TGCTACCTGG 
CTCGCCATGT 
CCACCCCAGT 
GAGAGCCCAA 
AGGCACCAGA 
CCACAAACTC 
AGACTCGGTC 
CCAAACATCT 
CTTCAAAGGC 
AGAGTTAAAA 
ATGCAAGGGT 
GTTGAATGTC 
GTACATATGT 
AAGAGCCAAT 
TCCTCCTTGT 
CTCCTCTGAA 
AGATGTATAG 
ATTTTCTATT 
TGTCTTAAAT 
CCAAGGAAAT 
ATGTCAAAAA 



AGGGAGGGCC 3180 

CGGCCCCAGA 3240 

GAAGGAAAGG 33 00 

AGCGCACACA 33 60 

ACTACCTGTC 342 0 

CTCTCCTGTC 3 480 

TTCTGGTGAG 3 54 0 

CCCTTTCAGC 3 600 

AGAGCTCCTG 3 660 

GTCTCCCTGG 3 72 0 

TTTCCTTCAA 3780 

CAAGAGTCCA 3 840 

TTCAGCTGCT 3 90 0 

CAGAGTCACA 3 960 

TGACCTCATG 4020 

CTCACACTGT 4080 

TTTGGCTCAG 4140 

TT CACAGT AC 42 0 0 

AT C TAGG CAT 42 60 

TATTTCTGTT 432 0 

ATGCTTGTCT 43 80 

AGTGTTTGT A 4440 

TATTTATTAT 450 0 

GTCATGATTG 4560 

TGGCTCTGGT 462 0 

AAAAAAAAAA 4680 



PCT/US02/12476 



30 



Seq ID NO: 453 Protein sequence 
Protein Accession #: Eos sequence 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



MGAAGRQDFL 
GKTLIiLTSSA 
TIILYGRADE 
ERSWGHRGVI 
SRNLDDMARK 
KLFQTEHGEY 
IQATTMDGVN 
STILNLEDNV 
EIDGVDMRAE 
GTELKHMGQQ 
KDWGYNSLG 
PKPRQDCNAV 
LGKFYNNRAH 
IRHFIAYKNQ 
FSPPCRCLLK 



11 
I 

FKAMLTISWL 
TVYSIHISEG 
GIQPDPYYGL 
VHVIDPKSGT 
AMTKLGSKHF 
FNVSLSSEWV 
LSTEWYKKG 
QSWKPGDTLV 
VGLLSRNI IV 
LVGQYPIHFH 
HCFFTEDGPE 
STFWMANPNN 
SNYRAGMIID 
DHGAWLRGGD 
LVTTGSPFAH 



21 
I 

TLTCFPGATS 
GKLVIKDHDE 
KY I GVGKGG A 
VIHSDRFDTY 
LHLGFRHPWS 
QDVEWTEWFD 
QDYRFACYDR 
IASTDYSMYQ 
MGEMEDKCYP 
LAGDVDERGG 
ERNTFDHCLG 
NLINCAAAGS 
NGVKTTEASA 
VWLDSCHFRG 
VSLAHS 



31 

TVAAGCPDQS 
PIVLRTRHIL 
LELHGQKKLS 
RSKKESERLV 
FLTVKGNPSS 
HDKVSQTKGG 
GRACRSYRVR 
AEEFQVLPCR 
YRNHICNFFD 
YDPPTYIRDL 
LLVKSGTLLP 
EETGFWFIFH 
KDKRPFLSII 
EAQEGFLLTG 



41 



51 



PELQPWNPGH 
IDNGGELHAG 
WTFLNKTLHP 
QYLNAVPDGR 
SVEDHIEYHG 
EKISDLVJKAH 
FLCGKPVRPK 
SCAPNQVKVA 
FDTFGGHIKF 
SIHHTFSRCV 
SDRDSKMCKM 
HVPTGPSVGM 
SARYSPHQDA 
MKAGGILLGG 



DQDHHVH I GQ 60 

SALCPFQGNF 120 

GGMAEGGYFF 180 

I L S VAVNDEG 240 

HRG S AAARVF 3 00 

PGKICNRPID 3 60 

LTVTIDTNVN 42 0 

GKPMYLHIGE 480 

ALGFKAAHLE 540 

TVHGSNGLLI 600 

ITEDSYPGYI 660 

YSPGYSEHIP 72 0 

DPLKPREPAI 780 

DEAASGMAQG 840 



Seq ID NO: 454 DNA sequence 

Nucleic Acid Accession #: NM_013282.2 

Coding sequence: 85. .2466 



85 



1 
I 

CGACTCCTTA 
GTCCCTCCCC 
ACCCACACGG 
CAGGAGCTGT 
GAGGACGGCC 
GTCCGCCAGA 
ACCGACTCCG 
GCGGCCGCCG 
GGGCTGTACA 
GAGGCGCAGG 
ACGTCCAGGC 
GAGAACGGCG 
AAGTGGCAGG 
AAGGAGCGGG 
CGGGAACTCT 
TTCGTGGACG 
CCCATGAGAC 
TGCCGGGTCT 
TGCGATGAGT 
CCCAGCGAGG 
GCGGGAGAGC 
TCACAGCGGG 
GTCCCGTCCA 
CGAGTCCAGG 
AG CAACGACG 
GGGAATTTTT 
GCGGAACAGT 
TTTGCTCCCA 
GTCAGGGTGG 
AACCGCTACG 
TTTCTCGTGT 
GAGGGGAAGG 



11 

1 

GAGCATGGCA 
TCAGCGCCGA 
TGGACTCGCT 
TCCACGTGGA 
ATACCCTCTT 
GCCTCGTGCT 
GCTGCTGCCT 
AGACTGACAG 
AGGTCAATGA 
TGGTCAGGGT 
CGGCGCTGGA 
TGGTCCAGAT 
ACCTGGAGGT 
GCTTCTGGTA 
ACGCCAACGT 
AAGTCTTCAA 
GGAAGAG CGG 
GCGCCTGCCA 
GCGACATGGC 
ACGAGTGGTA 
GGCTGAGAGA 
ACTGGGGCAA 
ACCACTACGG 
TCAGCGAGTC 
GAGCGTACTC 
TCACATACAC 
CTTGTGATCA 
TCAATGACCA 
TGCGCAATGT 
ATGGCATCTA 
GGCGCTACCT 
ACCGGATCAA 



21 



TGGCTCAGAG 
CACCATGTGG 
GTCCAGGCTG 
GCCAGGCCTG 
CGACTACGAG 
CCCCCACAGC 
GGGCCAGAGT 
CAGGCCAGCC 
GTACGTCGAT 
GACGCGGAAG 
GGAGGACGTC 
GAACT CCAGG 
GGGCCAGGTG 
CGACGCGGAG 
GGTGCTGGGG 
GATTGAGCGG 
GCCGTCCTGC 
CCTGTGCGGG 
CTTCCACATC 
CTGCCCTGAG 
GAGCAAGAAG 
GGGCATGGCC 
ACCCATCCCG 
GGGTGTCCAT 
CCTAGTCCTG 
GGGTAGTGGT 
GAAACTCACC 
AGAAGGGGCC 
CAAGGGTGGC 
CAAGGTTGTG 
TCTGCGGAGG 
GAAGCTGGGG 



31 

I 

GTGCTGGTAA 
ATCCAGGTTC 
ACCAAGGTGG 
CAGAGGCTGT 
GTCCGCCTGA 
ACCAAGGAGC 
GAGTCAGACA 
GATGAGGACA 
GCTCGGGACA 
GCCCCCTCCC 
ATTTACCACG 
GACGTCCGAG 
GTCATGCTCA 
AT CTCCAGGA 
GATGATTCTC 
CCGGGTGAAG 
AAGCACTGCA 
GGCCGGCAGG 
TACTGCCTGG 
TGCCGGAATG 
AAGGCGAAGA 
TGTGTGGGCC 
GGGATCCCCG 
CGGCCCCACG 
GCGGGGGGCT 
GGTCGAGATC 
AACACCAACA 
GAGGCCAAGG 
AAGAATAGCA 
AAATACTGGC 
GACGATGATG 
CTGACCATGC 



41 
I 

AACTGATGGG 
GGACCATGGA 
AGGAGCTGAG 
TCTACAGGGG 
ATGACACCAT 
GGGACTCCGA 
AGTCCTCCAC 
TGTGGGATGA 
CGAACATGGG 
GGGACGAGCC 
TGAAATACGA 
CGCGCGCCCG 
ACTACAACCC 
AGCGCGAGAC 
TGAACGACTG 
GGAGCCCCAT 
AGGACGACGT 
ACCCCGACAA 
ACCCGCCCCT 
ATGCCAGCGA 
TGGCCTCGGC 
GCACCAAGGA 
TGGGCACCAT 
TGGCTGGCAT 
ATGAG GATG A 
TTTCCGGCAA 
GGGCGCTGGC 
ACTGGCGGTC 
AGTACGCCCC 
CCGAGAAGGG 
AGCCTGGCCC 
AGTATCCAGA 



51 
I 

GGTTTTTGCT 60 

CGGGAGGCAG 120 

GCGGAAGATC 180 

CAAACAGATG 240 

CCAGCTCCTG 3 00 

GCTCTCCGAC 3 60 

CCACGGCGAG 42 0 

GACGGAATTG 480 

GGCGTGGTTT 54 0 

CTGCAGCTCC 600 

CGACTACCCG 6 60 

CACCATCATC 72 0 

CGACAACCCC 780 

CAGGACGGCG 840 

T CGG AT CATC 900 

GGTTGACAAC 960 

GAAC AG ACT C 1020 

GCAGCTCATG 10 80 

CAG CAGTGTT 1140 

GGTGGTACTG 1200 

CACATCGTCC 1260 

ATGTACCATC 132 0 

GTGGCGGTTC 13 80 

ACACGGCCGG 1440 

CGTGGACCAT 150 0 

CAAGAGGACC 1560 

TCTCAACTGC 1620 

GGGGAAGCCG 1680 

CGCTGAGGGC 1740 

GAAGTCCGGG 1800 

TTGGACGAAG 1860 

AGGCTACCTG 1920 



356 



10 



15 



20 



25 



30 



WO 02/086443 

GAAGCCCTGG CCAACCGAGA 
CAGGAGGGGG GCTTCGCGTC 
GGAGGTGGCC CGAGCAGGGC 
CCCTACAGTC TCACGGCCCA 
CTGTGGAATG AGGTCCTGGC 
TTGTTCCTGA GTAAAGTGGA 
CGGCCCATCA CGACCGTGTG 
CGGG CACAGG TGTTCAGCTG 
CAGGTGAACC AGCCTCTGCA 
CGGTGAT CTC CAAGCACTTC 
CATCGGCACT GATTTTGTTC 
CCTAAAAAGG TTTGTCTTCC 
GAATTTATGT ATTCTGGCTA 
CATAAAAGCC TGCAATTTCT 
A CTACGTGGT GTGGAGGCTG 
CAACTCTTTA AGAAGGCGAC 
AGCAAGCATC TTCCTGACAG 
TGGCCCGTGG CAGCCCGTGG 
AAAGAGGAAA CATCTCGGGC 
TGCTTAGCGT CTGAGATCCG 
CACGCAGAAA TGGCCTCAAG 
TGTCCGACGA AGGCGGCCAC 
GATTCGTTCC TTCTTTCTAA 
GTCAACCAGA TTCTAGAAAC 
GGAACCGTTT GAGCCTTATA 
CTTACAAGAG GGTTTTTTTT 
TTTTTTTTGT AGTTACTGTA 
TTGTTTTTGT ATTTTTTTTC 
TTGCAGCCTA TACCTCAATA 
GAGCAATGTT ATTTTTAAAG 
AGGGAAGAAT GAGACAATTT 
TTAGATTCTC AGAATAAATG 



GCGAGAGAAG 
CCCCAGGACG 
CGGGTCCCCG 
GCAGAGCAGC 
GTCACTCAAG 
GGAGACGTTC 
CCAGCACAAC 
CCCTGCCTGC 
GACCGTCCTC 
TCGACAGGCG 
TTAGTGGGCT 
TTTTTTTTTA 
AAAGTTGGAC 
CGACAAAACA 
TTGATGTTTC 
AGGATCAGTC 
CATTTTGTCA 
CATGGCGTGG 
CTAGTTCAAA 
CGTGAAAAGT 
GGGACTCTGC 
GGACGGACGC 
AGACGACAGT 
TGCGGTCATC 
GATCATTTAC 
TAATTTTTTT 
TATGTACCAA 
TTTTGAAAGG 
AAACAGGGAT 
GGTTTTTTTC 
TGTGTAGGCT 
TTTTTCACAG 



GAGAACAGCA 
GGCAAGGGCA 
CGCCGGACAT 
CTCATCAGAG 
GACCGGCCGG 
CAGTGTATCT 
GTGTGCAAGG 
CGCTACGACC 
AACCAGCTCT 
TTTTGCTGAA 
TAACTTAAAC 
TTTTTATTTT 
TT CTCAGT AT 
ACACAAGATT 
TGGTGTCAAG 
CTTCTCTAGG 
TCTAAAGTCC 
CTCAGCTGTC 
CCTTTGCCTC 
CCTCTGCCCA 
TCCACGTGGG 
CAGCACACGA 
CTTTGTTGTT 
CAGTTCTTCC 
ATTCAATTTT 
TTCTCTTAAT 
GAAAGATATA 
GTTTGTTAAT 
AT TTTAAATC 
ACCTCCTTAT 
TTTTCTAAAG 
ATTGAAAAAA 



AGAGGGAGGA 
AGTGGAAGCG 
CCAAGAAAAC 
AGGACAAGAG 
CGAGCGGCAG 
GCTGT CAGGA 
ACTGCCTGGA 
TGGGCCGCAG 
TCCCCGGCTA 
AACGTGTCGG 
AGGTAGTGTT 
TCAAAT CTAT 
TGTGTTTAGT 
TTTTAAAGAT 
TTCTCAGAAG 
GTTCTGGCCC 
AGTGACATGG 
TGTTGAAGTT 
AAAGCCATCC 
CGAGAGCAGG 
GCCAGGCGTG 
AGTCACGTGC 
AGCACTGAAT 
TGACACCGGA 
TTTAACTCAG 
GAACACATTT 
ACGTTAGGGT 
TTTTCTAATT 
ACATACCTGC 
TCTTAGATTA 
TCCAGTACTT 
AAAAAAAA 



GGAGGAGCAG 1980 

GAAGTCGGCA 2040 

CAAGGTGGAG 2100 

CAACGCCAAG 2160 

CCCGTTCCAG 2220 

GCTGGTGTTC 2280 

CAGATCCTTT 2 340 

CTATGCCATG 2400 

CGGCAATGGC 2460 

AGGGCTCGTT 252 0 

TCCTCCGTTC 2580 

ACATTTTCAG 2 640 

TCTTTGAAAA 2700 

GGAATCAGAA 2760 

TTGCTGCCAC 2820 

CCAAGGTCAG 288 0 

TTCCCCGTGG 2940 

GTTGCAAGGA 3000 

CCCACCAGAC 3060 

GAGTTGGGGC 312 0 

TGACTGACGC 318 0 

AAGTGCCTTT 3240 

TATTGAAAAT 33 00 

TGGGTGCTTG 3360 

CAAGTGAGAA 3420 

TCTAAATGAA 3 480 

TTGGTTGTTT 354 0 

TTACCAAAGT 3600 

AGACAAACTG 3660 

TTAATGTATT 372 0 

TGTCCAGATT 3780 
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Seq ID NO j 455 Protein sequence 
35 Protein Accession #: NP 037414.2 



40 



45 



50 



MWIQVRTMDG 
YEVRLNDTIQ 
PADEDMWDET 
DV I YHVKYDD 
AEISRKRETR 
SCKHCKDDVN 
PECRNDASEV 
IPGIPVGTMW 
SGGRDLSGNK 
GGKNSKYAPA 
LGLTMQYPEG 
SPRRTSKKTK 
TFQCICCQEL 



11 
1 

RQTHTVDSLS 
LLVRQSLVLP 
ELGLYKVNEY 
YPENGWQMN 
TARELYANW 
RLCRVCACHL 
VLAGERLRES 
RFRVQVSESG 
RTAEQSCDQK 
EGNRYDGIYK 
YLEALANRER 
VEPYSLTAQQ 
VFRPITTVCQ 



21 
I 

RLTKVEELRR 
HSTKERDSEL 
VDARDTNMGA 
SRDVRARART 
LGDDSLNDCR 
CGGRQDPDKQ 
KKKAKMASAT 
VHRPHVAGIH 
LTNTNRALAL 
WKYWPEKGK 
EKENSKREEE 
SSLIREDKSN 
HNVCKDCLDR 



31 
I 

KIQELFHVEP 
SDTDSGCCLG 
WFEAQWRVT 
IIKWQDLEVG 
IIFVDEVFKI 
LMCDECDMAF 
SSSQRDWGKG 
GRSNDGAYSL 
NCFAPINDQE 
SGFLVWRYLL 
EQQEGGFASP 
AKLWNEVLAS 
SFRAQVFSCP 



41 



51 



GLQRLFYRGK 
QSESDKSSTH 
RKAPSRDEPC 
QWMLNYNPD 
ERPGEGSPMV 
HIYCLDPPLS 
MACV GRTKEC 
VLAGGYEDDV 
GAEAKDWRSG 
RRDDDEPGPW 
RTGKGKWKRK 
LKDRPASGSP 
ACRYDLGRSY 



QMEDGHTLFD 60 

GEAAAETDSR 120 

SSTSRPALEE 180 

NPKERGFWYD 240 

DNPMRRKSGP 300 

SVPSEDEWYC 360 

TIVPSNHYGP 420 

DHGNFFTYTG 4 BO 

KPVRWRNVK 540 

TKEGKDRIKK 60 0 

SAGGGPSRAG 660 

FQJjFLSKVEE 72 0 
AMQVNQPLQT 



55 



Seq ID NO: 456 DNA sequence 

Nucleic Acid Accession #s NM_001200.1 

Coding sequence: 325.. 1514 
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GGGGACTTCT 
TGCCCCAGCG 
TGCCCGACAC 
GAGAAGGAGG 
AGAGTTTTTC 
CTGCGGTCTC 
TTCCCCAGGT 
TCGCGGCGGC 
TCGAGTTGCG 
CCGTGGTGCC 
CCGCCCCAGA 
ACCATGAAGA 
TCTTTAATTT 
TCCGAGAACA 
TTTATGAAAT 
ACACCAGGTT 
TGATGCGGTG 
TGGAGGAGAA 
ATGAACACAG 
GGCATCCTCT 
AGTCCAGCTG 
GGATTGTGGC 
TGG CTGATCA 
ACTCTAAGAT 
ACCTTGACGA 
GTGGGTGTCG 



TGAACTTGCA 
GAGCCTGCTT 
TGAGACGCTG 
AGGCAAAGAA 
CATGTGGACG 
CTAAAGGTCG 
CCTCCTGGGC 
GTCGTCGGGC 
GCTGCTCAGC 
CCCCTACATG 
CCACCGGTTG 
ATCTTTGGAA 
AAGTTCTATC 
GATGCAAGAT 
CATAAAACCT 
GGTGAATCAG 
GACTGCACAG 
ACAAGGTGTC 
CTGGTCACAG 
CCACAAAAGA 
TAAGAGACAC 
TCCCCCGGGG 
TCTGAACTCC 
TCCTAAGGCA 
GAATGAAAAG 
CTAGTACAGC 



GGGAGAATAA 
CGCCATCTCC 
TTCCCAGCGT 
AAGGAACGGA 
CTCTTTCAAT 
ACCATGGTGG 
GGCGCGGCTG 
CGCCCCTCAT 
ATGTTCGGCC 
CTAGACCTGT 
GAGAGGGCAG 
GAACTACCAG 
CCCACGGAGG 
GCTTTAGGAA 
GCAACAG CCA 
AATGCAAGCA 
GGACACGCCA 
TCCAAGAGAC 
ATAAGGCCAT 
GAAAAACGTC 
CCTTTGTACG 
TATCACGCCT 
ACTAATCATG 
TGCTGTGTCC 
GTTGTATTAA 
AAAATTAAAT 



31 
I 

CTTGCGCACC 
GAGCCCCACC 
GAAAAGAGAG 
CATTCGGTCC 
GGACGTGTCC 
CCGGGACCCG 
GCCTCGTTCC 
CCCAGCCCTC 
TGAAACAGAG 
ATCGCAGGCA 
CCAGCCGAGC 
AAACGAGTGG 
AGTTT AT CAC 
ACAATAGCAG 
ACTCGAAATT 
GGTGGGAAAG 
ACCATGGATT 
ATGTTAGGAT 
TGCTAGTAAC 
AAGCCAAACA 
TGGACTTCAG 
TTTACTGCCA 
CCATTGTTCA 
CGACAGAACT 
AGAACTATCA 
ACATAAATAT 



41 

I 

CCACTTTGCG 
GCCCCTCCAC 
ACTGCGCGGC 
TTGCGCCAGG 
CCGCGTGCTT 
CTGTCTTCTA 
GGAGCTGGGC 
TGACGAGGTC 
ACCCACCCCC 
CTCAGGTCAG 
CAACACTGTG 
GAAAACAACC 
CTCAGCAGAG 
TTTCCATCAC 
CCCCGTGACC 
TTTTGATGTC 
CGTGGTGGAA 
AAGCAGGTCT 
TTTTGGCCAT 
CAAACAGCGG 
TGACGTGGGG 
CGGAGAATGC 
GACGTTGGTC 
CAGTGCTATC 
GGACATGGTT 
ATATATA 



51 
I 

CCGGTGCCTT 60 

TCCTCGGCCT 12 0 

CGGCACCCGG 180 

TCCTTTGACC 240 

CTTAGACGGA 3 00 

GCGTTGCTGC 3 60 

CGCAGGAAGT 420 

CTGAGCGAGT 480 

AGCAGGGACG 540 

CCGGGCTCAC 600 

CGCAGCTTCC 660 

CGGAGATTCT 720 

CTTCAGGTTT 780 

CGAATTAATA 840 

AGACTTTTGG 900 

ACCCCCGCTG 960 

GTGG CCCACT 1020 

TTGCACCAAG 10 80 

GATGGAAAAG 1140 

AAACGCCTTA 120 0 

TGGAATGACT 12 60 

CCTTTTCCTC 132 0 

AACTCTGTTA 13 80 

TCGATGCTGT 1440 

GTGGAGGGTT 1500 



Seq ID NO: 457 Protein sequence 
Protein Accession #: NP 001191.1 



357 



WO 02/086443 
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1 11 21 31 41 51 

I I I I I I 

MVAGTRCLLA LLLPQVLLGG AAGLVPELGR RKFAAASSGR PSSQPSDEVL SEFELRLLSM 60 

5 FGLKQRPTPS RDAWPPYML DLYRRHSGQP GSPAPDHRLE RAASRANTVR SFHHEESIiEE 120 

LPETSGKTTR RFFFNJjSSIP TEEFITSAEL QVFREQMQDA LGNNSSFHHR INIYEIIKPA 180 
TANSKFPVTR LLDT 

Seq ID NO: 458 DNA sequence 
10 Nucleic Acid Accession #: NM_001999.2 
Coding sequence: 1..8736 

1 11 21 31 41 51 

I l l I I l 

iO ATGGGGAGAA GACGGAGGCT GTGTCTCCAG CTCTACTTCC TGTGGCTGGG CTGTGTGGTG 60 

CTCTGGGCGC AGGGCACGGC CGGCCAGCCT CAGCCTCCTC CGCCCAAGCC GCCCCGGCCC 120 

CAGCCGCCGC CGCAACAGGT TCGGTCCGCT ACAGCAGGCT CTGAAGGCGG GTTTCTAGCG 180 

CCCGAGTATC GCGAGGAGGG TGCCGCAGTG GCCAGCCGCG TCCGCCGGCG AGGACAGCAG 240 

GACGTGCTCC GAGGGCCCAA CGTGTGCGGC TCCAGATTCC ACTCCTACTG CTGCCCTGGA 3 00 

20 TGGAAGACGC TCCCTGGAGG AAACCAGTGC ATTGT CCCGA TTTGTAGAAA TAGTTGTGGA 3 60 

GATGGATTTT GTTCCCGTCC TAACATGTGT ACTTGTTCCA GTGGGCAAAT ATCATCAACC 42 0 

TGTGGAT CAA AATCAATTCA GCAGTGCAGT GTGAGATGCA TGAATGGTGG GACCTGTGCA 48 0 

GATGACCACT GCCAGTGCCA GAAAGGATAT ATTGGAACTT ATTGTGGACA ACCTGTCTGT 540 

G AAAATG GAT GTCAGAATGG TGGACGTTGC ATCGCCCAAC CGTGTGCTTG TGTTTATGGG 60 0 

25 TTCACTGGTC CACAGTGTGA AAGAGATTAC AGGACAGGCC CGTGTTTCAC TCAGGTCAAC 660 

AACCAGATGT GCCAAGGGCA GCTGACAGGC ATTGTCTGCA CGAAGACTCT GTGCTGTGCC 72 0 

ACCACTGGAC GGGCGTGGGG CCATCCCTGT GAGATGTGTC CAGCCCAGCC TCAGCCCTGC 7 80 

CGACGGGGTT TCATCCCCAA CATCCGCACT GGAGCTTGCC AAGATGTTGA TGAATGCCAG 84 0 

GCTATCCCAG GGATATGCCA AGGAGGAAAC TGTATCAATA CAGTGGGCTC TTTTGAATGC 900 

30 AGATGCCCTG CTGGTCACAA ACAGAGTGAA ACTACTCAGA AATGTGAAGA CATTGATGAG 960 

TGCAGCATCA TTCCTGGGAT ATGTGAAACT GGTGAATGTT CCAACACCGT GGGAAGCTAT 1020 

TTTTGTGTTT QTCCACGTGG ATATGTAACC TCAACAGATG GCTCTCGATG CATCGATCAG 108 0 

AGAACAGGCA TGTGTTTCTC GGGCCTGGTG AATGGCCGCT GTGCACAAGA GCT CCCGGGG 1140 

AGAATGACGA AAATGCAGTG CTGCTGTGAG CCTGGCCGCT GCTGGGGCAT CGGAAC CAT T 12 0 0 

35 CCTGAAGCCT GTCCTGT CAG AGGTTCTGAG GAATATCGCA GACTTTGCAT GGATGGACTT 12 60 

CCAATGGGAG GAATTCCAGG GAGTGCTGGT TCCAGACCTG GAGG CACTGG GGGAAATGGC 132 0 

TTTGCCCCAA GTGG CAATGG CAATGG CT AT GGCCCAGGAG GGACAGGCTT CATCCCCATC 13 80 

CCTGGAGGCA ATGGCTTTTC TCCTGGCGTT GGGGGAGCCG GTGTGGGGGC CGGGGGACAG 1440 

GGACCTATCA TCACTGGACT AACAATTCTG AAC C AG AC AA TAGATATCTG TAAGCAT CAT 1500 

40 GCTAACCTTT GTTTAAATGG ACGCTGTATA CCAACTGTCT CAAGCTACCG ATGTGAATGC 15 60 

AACATGGGTT ATAAGCAGGA TGCAAATGGA GATTGTATAG ATGTTGATGA ATGCACATCA 162 0 

AATCCCTGCA CTAATGGAGA TTGTGTTAAC ACACCTGGTT CCTATTATTG TAAATGTCAT 1680 

GCTGGATTCC AGAGGACTCC TACCAAGCAA GCATGCATTG ATATTGATGA GTGCATCCAG 174 0 

AATGGGGTTC TTTGTAAAAA CGGTCGATGC GTGAACTCAG ATGGAAGTTT CCAGTGCATT 1800 

45 TGCAATGCCG GCTTTGAATT AACTACAGAT GGAAAAAACT GTGTTGATCA TGATGAATGT 1860 

ACAACTACCA ACATGTGTTT GAATGGAATG TGCATCAATG AAGATGGCAG CTTCAAGTGC 1920 

ATCTGCAAAC CAGGATTTGT CTTGGCTCCA AATGGGCGTT ACTGTACTGA TGTTGATGAA 1980 

TGCCAGACCC CAGGAATCTG CATGAATGGG CACTGCATCA ACAGTGAAGG GTCCTTCCGC 2040 

TGTGACTGTC CCCCAGGCCT GGCTGTGGGC ATGGATGGAC GTGTGTGTGT TG AT AC T CAC 2100 

50 ATGCGCAGTA CCTGCTATGG AGGAATCAAG AAAGGAGTGT GTGTGCGTCC TTTCCCCGGT 2160 

GCAGTGACCA AGTCCGAATG CTGCTGTGCC AATCCAGACT ATGGTTTTGG AGAACCCTGC 222 0 

CAGCCATGCC CTGCAAAAAA TTCAGCTGAA TTCCACGGCC TTTGTAGTAG TGGAGTAGGT 2280 

ATCACTGTGG ATGGAAGAGA TAT CAATGAA TGTGCTTTGG ATCCTGATAT ATGTGCCAAT 2340 

GGGATTTGTG AAAACTTACG TGGTAGTTAC CGTTGTAATT GCAACAGTGG CTATGAACCA 240 0 

55 GATGCCTCTG GAAGAAACTG TATTGACATT GATGAATGTT TAGTAAACAG ACTGCTTTGT 2460 

GATAACGGAT TGTGCCGAAA CACGCCAGGA AGTTACAGCT GTACGTGCCC ACCAGGGTAT 252 0 

GTGTTCAGGA CTGAGACAGA GACCTGTGAA GATATAAATG AATGTGAAAG CAACCCATGT 2580 

GTCAATGGGG CCTGCAGAAA CAACCTTGGA TCTTTCAATT GTGAATGTTC GCCCGGCAGC 2 64 0 

AAACTCAGCT CCACAGGATT GATCTGTATT GACAGCCTGA AGGGGACCTG TTGGCTCAAC 2700 

60 ATCCAGGACA GCCGCTGTGA GGTGAATATT AATGGAGCCA CTCTGAAATC TGAATGCTGT 2 760 

GCCACCCTCG GAGCCGCCTG GGGGAGCCCC TGTGAGCGGT GTGAACTAGA TACAGCTTGC 2 820 

CCAAGAGGGC TTGCCAGGAT TAAAGGTGTT ACGTGTGAAG ATGTTAATGA GTGTGAGGTG 2 880 

TTCCCTGGCG TTTGTCCAAA TGGACGCTGT GTCAACAGTA AGGGATCTTT TCATTGCGAG 2940 

TGCCCTGAAG GCCTTACGTT GGATGGGACT GGCCGTGTAT GTTTGGATAT TCGCATGGAG 3 000 

65 CAGTGTTACT TGAAGTGGGA TGAAGATGAA TGCATCCACC CCGTTCCTGG AAAGTT CCGC 3060 

ATGGATGCCT GCTGCTGTGC TGTCGGGGCG GCTTGGGGCA CCGAGTGTGA GGAGTGCCCC 312 0 

AAACCTGGCA CCAAGGAATA CGAGACACTG TGCCCCCGCG GGGCTGGCTT TGCTAACCGA 3180 

GGGGATGTTC TTACTGGGCG GCCATTTTAC AAAGACATCA ATGAATGCAA AGCATTTCCT 32 40 

GGGATGTGCA CTTATGGGAA GTGCAGAAAT ACAATCGGAA GCTTCAAATG CCGTTGCAAT 33 0 0 

70 AGTGGCTTTG CTCTAGACAT GGAGGAAAGA AACTGCACGG ACATCGACGA GTGCAGGATT 3 3 60 

TCTCCTGACC TCTGTGGCAG TGGAATCTGC GTCAATACAC CGGGCAGCTT TGAGTGCGAG 342 0 

TGCTTCGAAG GCTATGAAAG TGGCTTCATG ATGATGAAGA ACTGCATGGA CAT T G ACG G A 3480 

TGTGAACGTA ACCCTCTCCT TTGTAGGGGT GGCACCTGTG TGAACACTGA GGGCAGCTTT 3540 

CAGTGTGACT GCCCACTGGG ACACGAGCTG TCACCATCCC GTGAGGACTG TGTGGAT AT T 3600 

75 AATGAATGCT CCCTGAGTGA CAATCTCTGC AGAAATGGAA AATGTGTGAA CATGATTGGA 3 660 

ACCTATCAGT GCTCTTGCAA TCCTGGATAT CAGGCTACGC CAGACCGCCA GGGCTGTACA 3720 

GATATTGATG AATGTATGAT AATGAACGGA GGCTGTGACA CCCAGTGCAC AAATTCAGAG 3 780 

GGAAGCTACG AATGCAGCTG CAGTGAGGGT TATGCCCTGA TGCCAGATGG GAGATCGTGT 3 840 

GCAGACATTG ATGAATGTGA AAACAATCCT GATAT CTGTG ATGGCGGCCA GTGTACCAAC 3900 

80 ATTCCTGGAG AGTATCGCTG CCTCTGCTAT GATGGCTTCA TGGCTTCCAT GGACATGAAA 3 960 

ACATGCATTG ATGTCAATGA ATGTGACCTA AATTCAAATA TCTGCATGTT TGGGGAATGT 4020 

GAGAACACAA AGGGATCCTT CATTTGCCAC TGTCAGCTGG GTTACTCAGT GAAGAAGGGG 4080 

ACCACAGGAT GTACAGATGT GGATGAGTGT GAAATTGGTG CTCATAACTG CGACATGCAT 4140 

GCCTCATGTC TGAATATCCC AGGAAGCTTC AAGTGTAGCT GCAGAGAAGG CTGGATTGGA 4200 

85 AACGGCATCA AGTGTATTGA TCTGGACGAA TGTTCTAATG GAACCCACCA GTGTAG CAT C 42 60 

AATGCTCAGT GTGTAAATAC CCCGGGCTCA TACCGCTGTG CCTGCTCCGA AGGTTTCACT 4320 

GGTGATGGCT TTACCTGCTC AGATGTTGAT GAGTGTGCAG AAAACATAAA CCTCTGTGAG 43 80 
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AACGGACAGT GCCTTAATGT CCCGGGTGCA TATCGCTGCG AGTGTGAGAT GGGCTTCACT 4440 

CCAGCCTCAG ACAGCAGATC CTGCCAAGAT ATTGATGAAT GCTCCTTCCA AAACATTTGT 4500 

GTCTCTGGAA CATGTAATAA CCTGCCTGGA ATGTTTCATT GCATCTGCGA TGATGGTTAT 4560 

GAATTGGACA GAACAGGAGG GAACTGTACA GATATTGATG AGTGTGCAGA TCCTATAAAC 4620 

TGTGTCAATG GCCTATGTGT CAACACGCCT GGTCGCTATG AGTGTAACTG CCCACCCGAT 4680 

TTTCAGTTGA ACCCAACTGG TGTGGGTTGT GTTGACAACC GTGTGGGCAA CTGCTACCTG 4740 

AAGTTTGGAC CT CGAGG AG A TGGGAGTCTG TCTTGCAACA CCGAGATCGG GGTGGGCGTC 4800 

AGTCGCTCTT CATGCTGCTG CTCTCTGGGA AAGGCCTGGQ GAAACCCCTG TGAGACATGC 4860 

CCCCCTGTCA ATAGCACTGA ATATTACACC CTGTGT CCCG GAGGTGAAGG CTTCAGACCT 492 0 

AACCCCATCA CAATCATTTT AGAAGACATT GACGAATGCC AGGAGTTACC AGGTCTCTGC 4980 

CAGGGTGGAA ACTG CAT CAA CACTTTTGGG AGCTTCCAGT GTGAGTGCCC ACAAGGCTAC 5040 

TACCT CAGCG AGGATACCCG CATCTGTGAG GATATTGATG AGTGTTTTGC ACATCCTGGT 5100 

GTGTGTGGGC CTGGGACCTG CTATAACACC CTGGGAAATT ACACCTGCAT TTGCCCACCT 5160 

GAGTACATGC AGGTCAATGG AGGCCACAAC TGCATGGACA TGAGAAAAAG CTTTTGCTAC 5220 

CGAAGCTATA ATGGAACCAC TTGTGAGAAT GAGTTGCCTT TCAATGTGAC AAAAAGGATG 52 80 

TGCTGCTGCA CATATAATGT GGGCAAAGCT GGGAACAAAC CTTGTGAACC ATGCCCAACT 5340 

CCAGGAACAG CTGACTTTAA AACCATATGT GGAAATATTC CTGGATTCAC CTTTGACATT 5400 

CACACAGGAA AAGCTGTTGA CATTGATGAA TGTAAAGAGA TTCCAGGCAT TTGTGCAAAT 5460 

GGTGTGTGCA TTAACCAGAT TGGCAGTTTC CGCTGTGAAT GCCCTACAGG ATTCAGTTAC 552 0 

AATGACCTGC TGTTGGTTTG TGAAGATATA GATGAGTGCA GCAATGGTGA TAATCTCTGC 5580 

CAGCGGAATG CAGACTGCAT CAATAGTCCT GGTAGTTACC GCTGTGAATG TGCCGCGGGT 5640 

TTCAAACTTT CACCCAATGG GGCCTGTGTA GATCGCAATG AATGTTTAGA AATTCCTAAC 5700 

GTTTGCAGTC ATGGCTTGTG TGTTGATCTG CAAGGAAGTT ACCAGTGCAT CTGCCACAAT 5760 

GGCTTTAAGG CTTCTCAGGA CCAGACCATG TGCATGGATG TTGATGAGTG CGAGCGGCAC 5 820 

CCATGTGGAA ATGGAACTTG TAAAAACACC. GTTGGATCCT ATAACTGTCT GTGCTACCCA 5 880 

GGGTTTGAAC TCACTCATAA TAATGATTGC CTGGACATAG ATGAGTGCAG TTCCTTTTTT 5 940 

GGTCAGGTGT GCAGAAATGG ACGTTGTTTT AATGAAATTG GTTCTTTCAA GTGTCTATGT 6000 

AACGAAGGTT ATGAACTTAC CCCAGATGGC AAAAACTGTA TAGACACTAA TGAGTGTGTC 6060 

GCCCTTCCCG GCTCTTGCTC TCCTGGTACC TGTCAGAATT TGGAGGGATC CTTCAGATGC 6120 

ATCTGTCCCC CAGGGTATGA AGTAAAAAGC GAGAACTGCA TTGATATAAA TGAATGTGAT 6180 

GAAGATCCCA ACATTTGTCT TTTTGGTTCC TGTACTAATA CTCCAGGGGG CTTCCAGTGC 6240 

CTCTGCCCCC CTGGCTTTGT ACTATCTGAT AATGGACGGA GATGCTTTGA TACTCGCCAG 6300 

AGCTTCTGCT TCACAAATTT TGAAAATGGA AAGTGTTCTG TACCCAAAGC TTTCAACACC 6360 

ACAAAAGCAA AATGCTGCTG TAGTAAGATG CCAGGAGAGG GCTGGGGGGA CCCCTGTGAG 642 0 

CTGTGCCCCA AAGACGATGA AGTTGCATTT CAGGATTTGT GTCCATATGG CCATGGAACT 6480 

GTCCCTAGTC TTCATGATAC ACGTGAAGAT GTCAATGAGT GT CTTGAGAG CCCAGGCATT 6540 

TGTTCAAATG GT CAATGT AT CAACACCGAC GGATCTTTTC GCTGTGAATG TCCAATGGGC 660 0 

TACAACCTTG ACTACACTGG AGTACGCTGT GTGGATACTG ATGAGTGTTC AATCGGCAAT 6660 

CCGTGTGGAA ATGGTACATG CACCAATGTT ATTGGGAGTT TTGAATGCAA TTGCAATGAA 672 0 

GGCTTTGAGC CAGGGCCCAT GATGAATTGT GAAGATATCA ACGAATGTGC CCAGAACCCA 67 80 

CTGCTGTGTG CTTTACGCTG CATGAACACT TTTGGGTCCT ATGAATGCAC GTGCCCGATT 6840 

GGCTATGCCC TCAGGGAAGA TCAAAAGATG TGCAAAGATC TGGATGAATG TGCTGAAGGG 6 900 

TTACACGACT GTGAATCTAG GGGCATGATG TGTAAGAATC TAATCGGCAC CTTCATGTGC 6 960 

ATCTGCCCTC CTGGAATGGC CCGAAGGCCC GATGGAGAAG GCTGTGTAGA TGAAAATGAA 7020 

TGCAGGACCA AG CCAGG AAT CTGTGAAAAT GGACGTTGTG TTAACATTAT TGGAAGCTAT 7080 

AGATGTGAGT GTAATGAAGG ATTCCAGT C A AGTTCTTCAG GCACTGAATG CCTTGACAAT 7140 

CGACAGGGTC TCTGCTTTGC AGAGGTACTG CAGACAATAT GTCAAATGGC ATCCAGTAGT 72 0 0 

CGCAATCTCG TCACTAAGTC AGAATGCTGC TGTGATGGTG GGCGAGGCTG GGGCCACCAG 7260 

TGCGAGCTTT GCCCACTTCC TGGAACTGCC CAGTACAAAA AGATATGTCC TCATGGCCCA 73 2 0 

GGATATACAA CTGATGGAAG AGATATTGAT GAATGTAAGG TAATGCCAAA CCTCTGCACC 73 80 

AATGGTCAGT GCATCAATAC CATGGGCTCA TTCCGATGCT TCTGCAAGGT TGGCTACACC 7440 

ACAGACATCA GTGGAACCTC TTGTATAGAC, CTTGATGAAT GCTCCCAGTC CCCGAAACCA 7500 

TGCAACTACA TCTGCAAGAA CACTGAGGGG AGTTATCAGT GTTCATGTCC GAGGGGGTAT 7560 

GT CCTGCAAG AGGATGGAAA GACATGCAAA GACCTTGATG AATGTCAAAC AAAGCAGCAT 762 0 

AACTGCCAGT TCCTCTGTGT CAACACCCTG GGGGGGTTTA CCTGTAAATG TCCACCTGGT 7680 

TTCACACAGC ATCACACTGC TTGTATCGAC AACAACGAAT GTGGGTCTCA ACCTTTGCTT 7740 

TGTGGAGGAA AGGGAATCTG TCAAAACACT CCAGGCAGTT TCAGCTGTGA ATGCCAAAGA 7800 

GGGTTCTCTC TTGATGCCAC CGGACTGAAC TGTGAAGATG TTGATGAATG TGATGGGAAC 7860 

CACAGGTGCC AACACGGCTG CCAGAACATC CTGGGTGGCT ACAGATGTGG CTGCCCCCAA 7 920 

GGCTACATCC AG CACTACCA GTGGAATCAG TGTGTCGATG AGAATGAATG CTCCAATCCC 7 980 

AATGCCTGTG GCTCTGCTTC CTGCTACAAC ACCCTGGGGA GTTACAAGTG CGCCTGCCCC 8040 

TCGGGGTTCT CCTTCGACCA GTTCTCCAGT GCCTGCCACG ACGTGAATGA GTGCTCGTCC 8100 

TCCAAGAACC CCTGCAATTA CGGCTGCTCT AACACGGAGG GGGGCTACCT CTGTGGCTGC 8160 

CCCCCTGGGT ATTACAGAGT GGGACAAGGC CACTGTGTCT CAGGAATGGG ATTTAACAAG 8220 

GGGCAGTACC TGT CACTGGA TACAGAGGTC GATGAGGAAA ATGCTCTGTC CCCAGAAGCA 82 80 

TGCTACGAGT GCAAAATCAA CGGCTATCCT AAGAAAGACA GCAGGCAGAA GAGAAGTATT 8340 

CATGAACCTG ATCCCACTGC TGTTGAACAG ATCAGCCTAG AGAGTGTCGA CATGGACAGC 8400 

CCCGTCAACA TGAAGTTCAA CCTCTCCCAC CTCGGCTCTA AGGAGCACAT CCTGGAACTA 8460 

AGGCCCGCCA TCCAGCCCCT CAACAACCAC ATCCGTTATG TCATCTCTCA AGGGAACGAT 8520 

GACAGCGTCT TCCGCATCCA CCAAAGGAAT GGGCTCAGCT ACTTGCACAC GGCCAAGAAG 8580 

AAGCTCATGC CCGGCACATA CACACTGGAA ATCACTAGCA TCCCTCTCTA CAAGAAGAAG 8 640 

GAGCTTAAGA AACTGGAAGA GAGCAATGAG GATGACTACC TCCTAGGGGA GCTTGGGGAG 8700 

G CT CT C AG AA TGAGGCTGCA GATTCAGCTC TATTAACCGT TCACAGACTT GGGCCCAGGC 8760 

TCAAATCCTA GCACAGCCAG TCTGCAGAAG CATTTGAAAA GTCAAGGACT AATTTTAAAG 8 82 0 

AGGAAAAATA ATAATAACTC TTGTTTCTTT CCTCCCTGTC TTAGACTTTG AATGTTGACC 8880 

CTCACAGGGA GGGATAATTT AGACTCTGGT ATGGCCAAAG ATTTGAGCTC AAAGGCAACC 8940 

GTGGTTACTG TATTTTTTAT ATAACTTCAT TTTAAAATAT AT T AAAAG AA ACCTAAATGT 9000 

TCAAGATATC AGCATATGGC ACTAAATGCA CAAAAATAAT GTGAGCTTTT TTTTTTTTTT 90 60 

CCTGTTAGCA GTCTGTAACA CTTTGGGTAT TTTGCTATAG TTGCTAATTA AAAAAATATA 9120 

GATGTTTATT TATTTTTAAT GCAGTAATAT ATGGAGAAAT GAACAAACTA TGTAAACAAA 9180 

AAGGGAAACT CACTTGTTTT TCTTTAGATT TATAAATTTG AGCTATTTTT TTTAGAGGTG 9240 

CTTTTTAAAA ATCCAATAGA TACAAGAGAT GTTTCCTTTG GTTTTCTGCC AGTCATCCAG 9300 

CTGATACACA CCTGAT CGAT TTTAAAGAAA GCCACACAGA GCTGAATCGG GCAGTGCTAA 9360 

TCAATAATTT AAAAGACATG AATGTCATTA GAT CCTTTAT AACGTAGATC GAAGCCAAAG 9420 

CAGCTCATTT GTGACAACAT TTCATATCAC CAGACACACC AGGCAACAGA AGTTGAAGCA 9480 

CAACCACTGT AGCAAAATAC CTTGACTGCT TGTGAGACCA TTAGCATTGC AGGCCAAACC 9540 

GTACTGTATT TCCTTCTCAT AACCTCAAGG AACCATATGT GCTACCCACA ACACCTCATT 960 0 
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CTTACCCAGG GTGCGCTGCG 
TTGAAAGGGA ACACCTGGCA 
ATTATGTTCA AGTTATTTCA 
GGAATATATG TTGTTGTTGT 
TGTAGTTATA CACCATATGC 
ACAATGAATT GATGTTTAGT 
TATTAAGAGC ACGTATCCAT 
CCAAACCTCA TATGTGAAAT 
CTGTGCTGAC CAAAGATTAG 
TTAATAACTA AAAAAAAACT 



TCCTCATGGT 
TTCTGTGGTG 
GGATTGCCAT 
TGTTTTAAAC 
CTCATTTTAT 
TTGCTTTAGT 
TATTCTTCTC 
GGCCAAAGCA 
TAACCAGTTA 
CGTGCC 



ACTGTAGGCA 
TTTCGTGCTG 
ATGTGCAAAC 
CCATTTTTTT 
CATAGCCTAT 
CATTTAAAAA 
AACCCAAGAA 
CATGCAGGCT 
TACCCAGTAT 



GCTGAAGAAC 
TCTTAAATAA 
AAATCATGCA 
TTTAGAATTT 
TGTGTATGAA 
GATATTGTAC 
CCTGTTTCCT 
CCTGGTTGTT 
TTTGAGGTTT 



CGCCGTTCCC 
TGGTGCATTT 
ATGCAGCCAA 
TCATTAATAC 
AGATGTTTGT 
CAGGATGTGC 
GGACCAGTGA 
CCTCTCAAAC 
TATTGTTTTT 



9660 
9720 
9780 
9840 
9900 
9960 
10020 
10080 
10140 



Seq ID NO: 459 Protein sequence 
Protein Accession #: NP_001990.1 



1 11 21 31 41 51 

I I I 1 I I 

MGRRRRLCLQ LYFLWLGCW LWAQGTAGQP QPPPPKPPRP QPPPQQVRSA TAGSEGGFLA 60 

PEYREEGAAV ASRVRRRGQQ DVLRGPNVCG SRFHSYCCPG WKTLPGGNQC IVPICRNSCG 12 0 

DGFCSRPNMC TCSSGQISST CGSKSIQQCS VRCMNGGTCA DDHCQCQKGY IGTYCGQPVC 180 

ENGCQNGGRC IAQPCACVYG FTGPQCERDY RTGPCFTQVN NQMCQGQI/TG IVCTKTLCCA 240 

TTGRAWGHPC EMCPAQPQPC RRGFIPNIRT GACQDVDECQ AIPGICQGGN CINTVGSFEC 300 

RCPAGHKQSE TTQKCEDIDE CSIIPGICET GECSNTVGSY FCVCPRGYVT STDGSRCIDQ 3 60 

RTGMCFSGLV NGRCAQELPG RMTKMQCCCE PGRCWGIGTI PEACPVRGSE EYRRLCMDGL 42 0 

PMGGIPGSAG SRPGGTGGNG FAPSGNGNGY GPGGTGFIPI PGGNGFSPGV GGAGVGAGGQ 480 

GPIITGLTIL NQTIDICKHH ANLCLNGRCI PTVSSYRCEC NMGYKQDANG DCIDVDECTS 540 

NPCTNGDCVN TPGSYYCKCH AGFQRTPTKQ ACIDIDECIQ NGVLCKNGRC VNSDGSFQCI 600 

CNAGFELTTD GKNCVDHDEC TTTNMCLNGM CINEDGSFKC ICKPGFVLAP NGRYCTDVDE 660 

CQTPGICMNG HCINSEGSFR CDCPPGLAVG MDGRVCVDTH MRSTCYGGIK KGVCVRPFPG 72 0 

AVTKSECCCA NPDYGFGEPC QPCPAKNSAE FHGLCSSGVG ITVDGRDINE CALDPD I CAN 780 

GICENLRGSY RCNCNSGYEP DASGRNCIDI DECLVNRLLC DNGLCRNTPG SYSCTCPPGY 840 

VFRTETETCE DINECESNPC VNGACRNNLG SFNCECSPGS KLSSTGLICI DSLKGTCWLN 900 

IQDSRCEVNI NGATLKSECC ATLGAAWGSP CERCELDTAC PRGLARIKGV TCEDVNECEV 960 

FPGVCPNGRC VNSKGSFHCE CPEGLTLDGT GRVCLDIRME QCYLKWDEDE CIHPVPGKFR 102 0 

MDACCCAVGA AWGTECEECP KPGTKEYETIi CPRGAGFANR GDVLTGRPFY KDINECKAFP 10 80 

GMCTYGKCRN TIGSFKCRCN SGFALDMEER NCTDIDECRI SPDLCGSGIC VNTPGSFECE 1140 

CFEGYESGFM MMKNCMDIDG CERNPLLCRG GTCVNTEGSF QCDCPLGHEL SPSREDCVDI 1200 

NECSLSDNLC RNGKCVNMIG TYQCSCNPGY QATPDRQGCT DIDECM1MNG GCDTQCTNSE 12 60 

GSYECSCSEG YALMPDGRSC ADIDECENNP DICDGGQCTN IPGEYRCLCY DGFMASMDMK 13 20 

TCIDVNECDL NSNICMFGEC ENTKGSFICH CQLGYSVKKG TTGCTDVDEC EIGAHNCDMH 13 80 

ASCLNIPGSF KCSCREGWIG NGIKCIDLDE CSNGTHQCSI NAQCVNTPGS YRCACSEGFT 1440 

GDGFTCSDVD ECAENINLCE NGQCLNVPGA YRCECEMGFT PASDSRSCQD IDECSFQNIC 150 0 

VSGTCNNLPG MFHCICDDGY ELDRTGGNCT DIDECADPIN CVNGLCVNTP GRYECNCPPD 1560 

FQLNPTGVGC VDNRVGNCYL KFGPRGDGSL SCNTEIGVGV SRSSCCCSLG KAWGNPCETC 162 0 

PPVNSTEYYT LCPGGEGFRP NPITIILEDI DECQELPGLC QGGNCINTFG SFQCECPQGY 1680 

YLSEDTRICE DIDECFAHPG VCGPGTCYNT LGNYTCICPP EYMQVNGGHN CMDMRKSFCY 1740 

RSYNGTTCEN ELPFNVTKRM CCCTYNVGKA GNKPCEPCPT PGTADFKTIC GNIPGFTFDI 180 0 

HTGKAVD IDE CKEIPGICAN GVCINQIGSF RCECPTGFSY NDLLLVCEDI DECSNGDNLC 1860 

QRNADCINSP GSYRCECAAG FKLSPNGACV DRNECLEIPN VCSHGLCVDL QGSYQCICHN 192 0 

GFKASQDQTM CMDVD ECERH PCGNGTCKNT VGSYNCLCYP GFELTHNNDC LDIDECSSFF 1980 

GQVCRNGRCF NEIGSFKCLC NEGYELTPDG KNCIDTNECV ALPGSCSPGT CQNLEGSFRC 2 040 

ICPPGYEVKS ENCIDINECD EDPNICLFGS CTNTPGGFQC LCPPGFVLSD NGRRCFDTRQ 210 0 

SFCFTNFENG KCSVPKAFNT TKAKCCCSKM PGEGWGDPCE LCPKDDEVAF QDLCPYGHGT 2160 

VPSLHDTRED VNECLESPGI CSNGQCINTD GSFRCECPMG YNLDYTGVRC VDTDECSIGN 222 0 

PCGNGTCTNV IGSFECNCNE GFEPGPMMNC EDINECAQNP LLCALRCMNT FGSYECTCPI 22 8 0 

GYALREDQKM CKDLDECAEG LHDCESRGMM CKNLIGTFMC ICPPGMARRP DGEGCVDENE 23 40 

CRTKPGICEN GRCVNIIGSY RCECNEGFQS SSSGTECLDN RQGLCFAEVL QTICQMASSS 2 40 0 

RNLVTKSECC CDGGRGWGHQ CELCPLPGTA QYKKICPHGP GYTTDGRDID ECKVMPNLCT 2460 

NGQCINTMGS FRCFCKVGYT TDISGTSCID LDECSQSPKP CNYICKNTEG SYQCSCPRGY 252 0 

VLQEDGKTCK DLDECQTKQH NCQFLCVNTL GGFTCKCPPG FTQHHTACID NNECGSQPLL 2580 

CGGKGICQNT PGSFSCECQR GFSLDATGLN CEDVDECDGN HRCQHGCQNI LGGYRCGCPQ 2 640 

GYIQHYQWNQ CVDENECSNP NACGSASCYN TLGSYKCACP SGFSFDQFSS ACHDVNECSS 2700 

SKNPCNYGCS NTEGGYLCGC PPGYYRVGQG HCVSGMGFNK GQYLSLDTEV DEENALSPEA 2760 

CYECKINGYP KKDSRQKRSI HEPDPTAVEQ ISIiESVDMDS PVNMKFNLSH LGSKEHILEI, 2 82 0 

RPAI QPLNNH IRYVISQGND DSVFRIHQRN GLSYLHTAKK KLMPGTYTLE ITSIPLYKKK 2 880 
ELKKLEESNE DDYLLGELGE ALRMRLQIQL Y 



Seq ID NO: 460 DNA sequence 

Nucleic Acid Accession #: NM_013372.1 

Coding sequence: 63..617 



GCGGCCGCAC 
GTATGAGCCG 
CGGCTGCTGA 
AGCACAATGA 
GGGGCCAAGG 
CCCTGCATGT 
AGCAGACCAT 
GCCAGTGCAA 
CCTGCTCCTT 
AACTACAGCC 
CCATCGATTT 
AGGAAGTCCC 
AACCCCCAGC 
ATGGGTGCCT 
CCCTATTTTG 



11 
I 

TCAGCGCCAC 
CACAGCCTAC 
AGGGAAAAAG 
CTCAGAGCAG 
GCGGGGCACT 
GACGG AG CGC 
CCACGAGGAA 
CTCTTTCTAC 
CTGCAAGCCC 
ACCTACCAAG 
GGATTAAGCC 
AGACCTAAAA 
TGCCTCCTGG 
GTGGGTGTTT 
TAAACATATC 



21 
I 

GCGTCGAAAG 
ACGGTGGGAG 
AAAGGGTCCC 
ACTCAGTCGC 
GCCATGCCCG 
AAATACCTGA 
GGCTGCAACA 
ATCCCCAGGC 
AAGAAATTCA 
AAGAAGAGAG 
AAATCCAGGT 
CAACCAGATT 
CAGGAGCCTG 
TTAGACACCA 
TGCTTTAATG 



31 
I 

CGCAGGCCCC 
CCCTGCTTCT 
AAGGTGCCAT 
CCCAGCAGCC 
GGGAGGAGGT 
AGCGAGACTG 
GTCGCACCAT 
ACATCCGGAA 
CTACCATGAT 
TCACACGTGT 
GCACCCAGCA 
CTTACTTGGC 
CTTGTGCGTA 
GAGAAAACAC 
GGGATGTACC 



41 

I 

GAGGACCCGC 
CCTCTTGGGG 
CCCCCCGCCA 
TGGCTCCAGG 
GCTGGAGTCC 
GTGCAAAACC 
CATCAACCGC 
GGAGGAAGGT 
GGTCACACTC 
GAAGCAGTGT 
TGTCCTAGGA 
T TAAAC CTAG 
GTTCGTGTGC 
AGTCTCTGCT 
AGAAACCCAC 



51 

I 

CGCACTGACA 60 

ACCCTGCTGC 12 0 

GACAAGGCCC 180 

AACCGGGGGC 240 

AGCCAAGAGG 3 0 0 

CAGCCGCTTA 3 60 

TTCTGTTACG 420 

TCCTTTCAGT 480 

AACTGCCCTG 540 

CGTT G CAT AT 600 

ATGCAGCCCC 660 

AGGCCAGAAG 720 

ATGAGTGTGG 780 

AGAGAGCACT 840 

CTCACCCCGG 900 
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CTCACATCTA AAGGGG CGGG GCCGTGGTCT GGTTCTGACT TTGTGTTTTT GTGCCCTCCT 960 

GGGGACCAGA ATCTCCTTTC GGAATGAATG TTCATGGAAG AGGCTCCTCT GAGGGCAAGA 102 0 

GACCTGTTTT AGTGCTG CAT TCGACATGGA AAAGTCCTTT TAACCTGTGC TTGCATCCTC 1080 

CTTTCCTCCT CCTCCTCACA ATCCATCTCT TCTTAAGTTG ATAGTGACTA TGTCAGTCTA 1140 

ATCTCTTGTT TGCCAAGGTT CCTAAATTAA TTCACTTAAC CATGATGCAA ATGTTTTTCA 12 0 0 

TTTTGTGAAG ACCCTCCAGA CTCTGGGAGA GGCTGGTGTG GGCAAGGACA AGCAGGATAG 12 60 

TGGAGTGAGA AAGGGAGGGT GGAGGGTGAG GCCAAATCAG GTCCAGCAAA AGTCAGTAGG 132 0 

GACATTGCAG AAGCTTGAAA GGCCAATACC AGAACACAGG CTGATGCTTC TGAGAAAGTC 13 80 

TTTTCCTAGT ATTTAACAGA ACCCAAGTGA ACAGAGGAGA AATGAGATTG CCAGAAAGTG 1440 

ATTAACTTTG GCCGTTGCAA TCTGCTCAAA CCTAACACCA AACTGAAAAC ATAAATACTG 1500 

ACCACTCCTA TGTTCGGACC CAAGCAAGTT AGCTAAACCA AACCAACTCC TCTGCTTTGT 1560 

CCCTCAGGTG GAAAAGAGAG GTAGTTTAGA ACTCTCTGCA TAGGGGTGGG AATTAATCAA 1620 

AAACC KCAGA GGCTGAAATT CCTAATACCT TTCCTTTATC GTGGTTATAG TCAGCTCATT 1680 

TCCATTCCAC TATTTCCCAT AATGCTTCTG AGAGCCACTA ACTTGATTGA TAAAGATCCT 1740 

GCCTCTGCTG AGTGTACCTG ACAGTAAGTC TAAAGATGAR AGAGTTTAGG GACTACTCTG 1800 

TTTTAGCAAG ARATATTKTG GGGGTCTTTT TGTTTTAACT ATTGTCAGGA GATTGGGCTA 1860 

RAGAGAAGAC GACGAGAGTA AGGAAATAAA GGGRATTGCC TCTGGCTAGA GAGTAAGTTA 1920 

GGTGTTAATA CCTGGTAGAA ATGTAAGGGA TATGACCTCC CTTTCTTTAT GTGCTCACTG 1980 

AGGATCTGAG GGGACCCTGT TAGG AG AG CA TAGCATCATG ATGTATTAGC TGTTCATCTG 2040 

CTACTGGTTG GATGGACATA ACTATTGTAA CTAT TCAGT A TTTACTGGTA GGCACTGTCC 210 0 

TCTGATTAAA CTTGGCCTAC TGGCAATGGC TACTTAGGAT TGATCTAAGG GCCAAAGTGC 2160 

AGGGTGGGTG AACTTTATTG TACTTTGGAT TTGGTTAACC TGTTTTCTTC AAGCCTGAGG 2220 

TTTTATATAC AAACTCCCTG AATACTCTTT TTGCCTTGTA TCTTCTCAGC CTCCTAGCCA 2280 

AGTCCTATGT AATATGGAAA ACAAACACTG CAGACTTGAG ATTCAGTTGC CGATCAAGGC 2340 

TCTGGCATTC AGAGAACCCT TGCAACTCGA GAAGCTGTTT TTATTTCGTT TTTGTTTTGA 2400 

TCCAGTGCTC TCCCATCTAA CAACTAAACA GGAGCCATTT CAAGGCGGGA GATATTTTAA 2460 

ACACCCAAAA TGTTGGGTCT GATTTTCAAA CTTTTAAACT CACTACTGAT GATTCTCACG 2520 

CTAGGCGAAT TTGTCCAAAC ACATAGTGTG TGTGTTTTGT ATACACTGTA TGACCCCACC 2580 

CCAAAT CTTT GTATTGTCCA CATTCTCCAA CAATAAAGCA CAGAGTGGAT TTAATTAAGC 2640 

ACACAAATGC TAAGGCAGAA TTTTGAGGGT GGGAGAGAAG AAAAGGGAAA GAAGCTGAAA 2700 

ATGTAAAACC ACACCAGGGA GGAAAAATGA CATTCAGAAC CAGCAAACAC TGAATTTCTC 2760 

TTGTTGTTTT AACTCTGCCA CAAGAATGCA ATTTCGTTAA TGGAGATGAC TTAAGTTGGC 2 82 0 

AGCAGTAATC TTCTTTTAGG AGCTTGTACC ACAGTCTTGC ACATAAGTGC AGATTTGGCT 2 880 

CAAGTAAAGA GAATTTCCTC AACACTAACT TCACTGGGAT AATCAGCAGC GTAACTACCC 2 940 

TAAAAGCATA TCACTAGCCA AAGAGGGAAA TATCTGTTCT TCTTACTGTG CCTATATTAA 3 000 

GACTAGTACA AATGTGGTGT GTCTTCCAAC TTTCATTGAA AATG CC AT AT CTATACCATA 30 6 0 

TTTTATTCGA GTCACTGATG ATGTAATGAT ATATTTTTTC ATTATTATAG TAGAATATTT 312 0 

TTATGGCAAG ATATTTGTGG T CTTGAT CAT ACCTATTAAA ATAATGCCAA ACACCAAATA 3180 

TGAATTTTAT GATGTACACT TTGTGCTTGG CATTAAAAGA AAAAAACACA CATCCTGGAA 3240 

GTCTGTAAGT TGTTTTTTGT TACTGTAGGT CTTCAAAGTT AAGAGTGTAA GTGAAAAATC 33 0 0 

TGGAGGAGAG GATAATTTCC ACTGTGTGGA ATGTGAATAG TTAAATGAAA AGTTATGGTT 33 60 

AT T T AATGT A ATTATTACTT CAAATCCTTT GGTCACTGTG ATTTCAAGCA TGTTTTCTTT 3420 

TTCTCCTTTA TATGACTTTC TCTGAGTTGG GCAAAGAAGA AGCTGACACA CCGTATGTTG 3480 

TTAGAGTCTT TTATCTGGTC AGGGGAAACA AAATCTTGAC CCAGCTGAAC ATGTCTTCCT 3 540 

GAGTCAGTGC CTGAATCTTT ATTTTTTAAA TTGAATGTTC CTTAAAGGTT AACATTTCTA 3 60 0 

AAGCAAT AT T AAGAAAGACT TTAAATGTTA TTTTGGAAGA CTTACGATGC ATGTATACAA 3 660 

ACGAATAGCA GATAATGATG ACTAGTTCAC ACATAAAGTC CTTTTAAGGA GAAAATCTAA 3 72 0 

AATGAAAAGT GGATAAACAG AACATTTATA AGTGATCAGT TAATGCCTAA GAGTGAAAGT 3780 

AGTTCTATTG ACATTCCTCA AGATATTTAA TATCAACTGC ATTATGTATT ATGTCTGCTT 3 840 

AAATCATTTA AAAACGGCAA AGAATTATAT AGACTATGAG GTACCTTGCT GTGTAGGAGG 3 900 

ATGAAAGGGG AGTTGATAGT CTCATAAAAC TAATTTGGCT TCAAGTTTCA TGAATCTGTA 3 960 

ACTAGAATTT AATTTTCACC CCAATAATGT TCTATATAGC CTTTGCTAAA GAGCAACTAA 402 0 
TAAATTAAAC CTATTCTTTC AAAAAAAAA 
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MSRTAYTVGA LLLLLGTLLP AAEGKKKGSQ GAIPPPDKAQ HNDSEQTQSP QQPGSRNRGR 6 0 

GQGRGTAMPG EEVLESSQEA LHVTERKYLK RDWCKTQPLK QTIHEEGCNS RTI INRFCYG 12 0 

QCNSFYIPRH IRKEEGSFQS CSFCKPKKFT TMMVTLNCPE LQPPTKKKRV TRVKQCRCIS 180 
IDLD 
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ATGAAAGTTG GAGTGCTGTG GCTCATTTCT TTCTTCACCT TCACTGACGG CCACGGTGGC 60 

TTCCTGGGGA AAAATGATGG CATCAAAACA AAAAAAGAAC TCATTGTGAA TAAGAAAAAA 12 0 

CATCTAGGCC CAGTCGAAGA ATATCAGCTG CTGCTTCAGG TGACCTATAG AGATTCCAAG 180 

GAGAAAAGAG ATTTGAGAAA TTTTCTGAAG CTCTTGAAGC CTCCATTATT AT GGT CAC AT 240 

GGGCTAATTA GAATT AT CAG AGCAAAGGCT ACCACAGACT GCAACAGCCT GAATGGAGTC 300 

CTGCAGTGTA CCTGTGAAGA CAGCTACACC TGGTTTCCTC CCTCATGCCT TGATCCCCAG 3 60 

AACTGCTACC TTCACACGGC TGGAGCACTC CCAAGCTGTG AATGTCATCT CAACAACCTC 420 

AGCCAGAGTG TCAATTTCTG TGAGAGAACA AAGATTTGGG GCACTTTCAA AATTAATGAA 480 

AGGTTTACAA ATGACCTTTT GAATTCATCT TCTGCTATAT ACTCCAAATA TGCAAATGGA 540 

ATTGAAATTC AACTTAAAAA AGCATATGAA AGAATTCAAG GTTTTGAGTC GGTTCAGGTC 60 0 

ACCCAATTTC GAAATGGAAG CATCGTTGCT GGGTATGAAG TTGTTGGCTC CAGCAGTGCA 660 

TCTGAACTGC TGTCAGCCAT TGAACATGTT GCCGAGAAGG CTAAGACAGC CCTTCACAAG 720 

CTGTTTCCAT TAGAAGACGG CTCTTTCAGA GTGTTCGGAA AAGCCCAGTG TAATGACATT 780 

GTCTTTGGAT TTGGGTCCAA GGATGATGAA TATACCCTGC CCTGCAGCAG TGGCTACAGG 840 

GGAAACATCA CAGCCAAGTG TGAGTCCTCT GGGTGGCAGG TCATCAGGGA GACTTGTGTG 900 

CTCTCTCTGC TTGAAGAACT GAACAAGAAT TTCAGTATGA TTGTAGGCAA TGCCACTGAG 960 

GCAGCTGTGT CATCCTTCGT GCAAAATCTT TCTGTCATCA TTCGGCAAAA CCCATCAACC 1020 
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ACAGTGGGGA ATCTGGCTTC 
GCCAGCCATT TCAGGGTGTC 
ATCCTTAATT CAGCCTCAGT 
AGCT CACGGT TACTAGAGAC 
CCTCTGAATT TTTCTCGGAA 
CTCAAAAGGG GTTACAGCTA 
AGAGGCCGTG TGTTAATTGG 
AGCATGGCCT CGTTGACTCT 
GTCAATGGAC CTGTGATATC 
TTTTTTTCCA AGATAGAGTC 
CATTTGCAGT GGAACGATGC 
TGCCAATGTA CTCACTTGAC 
ATCTTCCCCG TTGTAAAATG 
ATTTTATGCC TGATCATCGA 
CACACACGTC GTATTTG CAT 
TTTATTGTTG GTGCCACAGT 
GTGTTCTTTA CACACTTCTT 
CTGCTGGCTT ACCGGATCAT 
GTTGGATTTT GCCTGGGTTA 
ACGCAACCTA GCAATACCTA 
AGCAAACCAC TCCTGGCTTT 
GTGGTGCTGC TAGTTCTCAC 
GATGACAAGG CCACCATCAT 
GGGCTCACCT GGGGCTTTGG 
GTTATTTTTG CTTTACTCAA 
TTGGACAGTA AGCTGCGACA 
CAAACAGAAA AGCAAAACTC 
AACCCACTGC AAAACAAAGG 
AT CATGCTAA CTCAGTTTGT 



GGTGGTGTCG 
CAATTCAACA 
AACCAACTGG 
ATTAGAAAAC 
ATTCATTGAC 
TCAGATTAAA 
GTCAGACCAA 
GGGGAACATT 
CACGGTTATT 
AAACCTGAGC 
AGGCTGCCAC 
CTCCTTCTCC 
GATCACCTAT 
GGCTTTGTTT 
GGTGAACATA 
GGACACCACG 
CTACCTCTCT 
CCTCGTGTTC 
TGGGTGCCCT 
CAAAAGGAAA 
TGTTGTCCCT 
AAAGCTCTGG 
CCGCGTGGGG 
AATAGGAACA 
TGCATTCCAG 
ACTTCTGTTC 
ATCAGATTTA 
CCATTATGCA 
CTCAAATGAA 



ATTCTGAGCA 
ATGGAGGATG 
ACAGTCTTAC 
ATCAGCACTC 
TGGAAAGGGA 
ATGTGTCCCC 
TTCCAGAGAT 
CTACCCGTTT 
CAAAACTATT 
CAGCCTCATT 
CTAGTGAATG 
ATATTGATGT 
GTGGGACTGG 
TGGAAGCAGA 
GCCCTGTCCC 
GTGAACCCTT 
TTGTTCTTCT 
CATCACATGG 
CTCATTATAT 
GATGTGTGTT 
GCACTGGCTA 
AGGCCGACTG 
AAGAGCCTCC 
ATAGTGGACA 
GGATTTTTTA 
AACAAGTTGT 
TCTGCCAAAC 
TTTTCTCATA 
TAA 



ATATTTCATC 
TCAT CAGTAT 
TGCGGGAAGA 
TGGTGCCTCC 
TTCCAGTGAA 
AAAATACATC 
CCCTTCCAGA 
CCAAAAATGG 
CCATAAAT G A 
GTGTGTTTTG 
AAACTCAAGA 
CACCTTTTGT 
GTATCTCCAT 
TTAAAAAAAG 
TCTTGATTGC 
CTGGAGTCTG 
GGATGCTCAT 
CCCAGCATTT 
CTGT CATTAC 
GGCTTAACTG 
TTGTGGCTGT 
TTGGGGAAAG 
TCATTCTGAC 
GCCAGAATCT 
TCTTATGCTT 
CTGCCTTAAG 
CCAAATTCTC 
CTGGAGATTC 



TCTGTCACTG 1080 

AGCTGACAAT 1140 

AAAGTATGCC 1200 

GACAGCTCTT 1260 

CAAAAGCCAA 1320 

TATTCCCATC 1380 

AACTATTATC 1440 

AAATGCTCAG 150 0 

AGTTTTCCTA 1560 

GGATTTCAGT 1620 

CATCGTGACG 1680 

CCCCTCTACA 1740 

TGGAAGTCTC 1800 

CCAAACCTCT 1860 

TGATGTCTGG 1920 

CACAGCTGCT 1980 

GCTTGGCATC 2 040 

GATGATGGCT 2100 

CATTGCTGTC 2160 

GTCCAATGGA 222 0 

GAACTTCGTT 22 80 

ACTGAGTCGG 2 340 

CCCTCTGCTA 2400 

GGCTTGGCAT 24 60 

TGGAATACTC 2520 

TTCTTGGAAG 2580 

AAAGCCTTTC 2640 

CTCCGACAAC 2 700 
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35 



40 



45 



50 



MKVGVLWLIS 
EKRDLRNFLK 
NCYLHTAGAL 
IEIQLKKAYE 
LFPLEDGSFR 
LSLLEELNKN 
ASHFRVSNST 
PLNFSRKFID 
SMASLTLGNI 
HLQWNDAGCH 
ILCLIIEALF 
VFFTHFFYLS 
TQPSNTYKRK 
DDKAT I I RVG 
LDSKIiRQLLF 
IMLTQFVSNE 



11 
I 

FFTFTDGHGG 
LLKPPLLWSH 
PSCECHLNNL 
RIQGFESVQV 
VFGKAQCNDI 
FSM I VGNATE 
MEDVISIADN 
WKGIPVNKSQ 
LPVSKNGNAQ 
LVNETQDIVT 
WKQIKKSQTS 
LFFWMLMLGI 
DVCWLNWSNG 
KSLLILTPLL 
NKLSALSSWK 



21 

I 

FLGKNDG I KT 
GLIRIIRAKA 
SQSVNFCERT 
TQFRNGSIVA 
VFGFGSKDDE 
AAVSSFVQNL 
ILNSASVTNW 
LKRGYSYQIK 
VNGPVISTVI 
CQCTHLTSFS 
HTRRICMVNI 
LLAYRIILVF 
SKPLLAFWP 
GLTWGFGIGT 
QTEKQNSSDL 



31 

! 

KKELIVNKKK 
TTDCNSLNGV 
KIWGTFKINE 
GYEWGSSSA 
YTLPCSSGYR 
SVIIRQNPST 
TVLLREEKYA 
MCPQNTSIPI 
QNYSINEVFL 
ILMSPFVPST 
ALSLLIADVW 
HHMAQHLMMA 
ALAIVAVNFV 
IVDSQNLAWH 
SAKPKFSKPF 



41 
I 

HLGPVEEYQL 
LQCTCEDSYT 
RFTNDLLNSS 
SELL S A I EHV 
GNITAKCESS 
TVGNLASWS 
SSRLLETLEN 
RGRVLIGSDQ 
FFSKIESNLS 
IFPWKWITY 
FIVGATVDTT 
VGFCLGYGCP 
WLLVLTKLW 
VIFALLNAFQ 
NPLQNKGHYA 



51 
I 

LLQVTYRDSK 60 

WFPPSCLDPQ 120 

SAIYSKYANG 180 

AEKAKTALHK 240 

GWQVIRETCV 300 

ILSNISSLSL 3 60 

ISTLVPPTAL 42 0 

FQRSLPETII 4 80 

QPHCVFWDFS 540 

VGLGISIGSL 600 

VNPSGVCTAA 660 

LIISVITIAV 720 

RPTVGERLSR 780 

GFFILCFGIL 840 

FSHTGD S SDN 900 



55 
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60 



65 



70 



75 



80 



85 



GGGCATGCAG 
CAGTTCTAGT 
CCAAGAGGAA 
TTGGTTTGAA 
AGGAGGAAGG 
GAGACTATTT 
AAGAAAGGAA 
GTAGACAGAA 
AATCTCCTCC 
AATAAAATGT 
AAGGAAGTGA 
GTAATGACAG 
GGATTCCTGG 
CAAGTGTTCA 
TCAGGATATG 
TAGGAGAACT 
CAAGCTTTCT 
TTCAACCTTC 
CCATAGATTG 
CCTCCATTCC 
TGGTACCCGA 
CTGGATGCAG 
TTTCCTCTTC 
CTATTCCCCG 
ATATATATTG 
GTGAGAAATT 
CCTATGTGTT 
AAAACAAACT 
TGTGGAGAAA 



11 
I 

CCATCGGGGA 
AAAAGGGAGA 
TTAGGGAGAG 
AGCATACAGT 
GAGGCAAGAG 
CCCTCTCTGC 
AGCTAGTTAG 
TCCTTGGGAA 
ACTAACCAGT 
TCTCTTGACT 
GGTCCAGGAA 
GATATTTCCT 
AGCCAATGAA 
TATGCAAAAA 
TCCAGTCTCA 
ATTTAGGAAC 
CTAAATTTAA 
AGGGCAAACC 
GTCCCCTGTA 
CAGGATGAGC 
GTAAAT CCAT 
ACTCAGCTGA 
TTTCTTTTTC 
ACTTCAATCA 
ATACAGGAGA 
TCCAGATTGG 
TCTGGCACCT 
CACGGCTGGT 
TCAGAACTCT 



21 



AAATCCATAG 
ACATCAATAT 
AGTTATAAGA 
AAATATGATG 
ATAATATCAT 
TTTTCAAACC 
TCTTGTTCTG 
TACAGTAATT 
TTCCCTATAG 
TTGTTACTTA 
AATCTAGGAG 
GAAAGTGTAA 
GTTGGTGTAT 
CTTCTTGGAA 
CACACCAGGA 
AGAAAAAAAT 
GCAAACTCCT 
TCCGTGCCTC 
ACCCCGGTTT 
TTGTTGCTTC 
CCTACTCCAA 
GAAGACCATT 
TTCTATCTTT 
GGGAACTTAT 
CCTAAGAAGA 
AAACACAGCT 
TGTTGTAGAT 
GTTAAAAAGG 
ATTCACGGT C 



31 
i 

TGCAGATAAA 
AGGATGTTTC 
GATCAGCAAG 
TCTGTCCCTG 
TTTCTCTGTG 
TTACTGGAGT 
AGGTTGTTCA 
GACATATATT 
ATTGCCACAA 
ACAATGCTGA 
ATATTTCTTA 
TTTCCCATTG 
GTTTATGAAA 
TTTCTGAGTT 
TATGTCCTTT 
GCCTGAAATG 
GGTCATTTTC 
AGACGTTTAG 
GTCTCAGCTT 
TGTCCTATGA 
TAGAGGAAGG 
ATTCATTTTT 
GGATTTTTAG 
ACCTCTTAAA 
GCATGTCTTG 
TCCTTTCTCC 
AAATCTCCCT 
GCCCATGACA 
GGTTGGAATG 



41 

1 

GCAAGGAGGA 
T TAG CAAT AG 
GGGACAGGGT 
GCAGTGTTGG 
CTCCAACTGT 
TGTTTTCCCT 
ATGTATACAT 
CTGTTATTTG 
GCACATAATA 
GAAAACTTTA 
ACCAATCTAT 
AGGATTTGTT 
TATCAAGAGA 
CTCTGTGGCA 
CTAGCCTGTC 
ATTTCTCATT 
AGTTAGTACC 
CCATAGTCTG 
GTTATCCTGT 
GACATTAGAT 
TCCATTTTTG 
GGAATTCTTT 
TCCATCAACG 
CTCATTCAGA 
GGGGTTGAGG 
CATCCAGCCC 
TGACTTTGTG 
ATACCAAGTG 
CACACTTGTG 



51 
1 

AGAAGAAGGA 60 

AAAAAGAAGG 12 0 

TAGATTTGGT 180 

CAGAGTAGGA 240 

ACTTACATAT 300 

CATGAAAACC 3 60 

ATCTATATCT 42 0 

ATGCTTGAAA 480 

AGAAACAATA 540 

CAGCCTTCAT 600 

AAAGGCATTA 660 

TTTAATTTCT 72 0 

CATAAGTTGG 780 

ATATATGACA 840 

TATCACATGC 900 

TGAACTCATC 960 

TTTCCTTAAG 1020 

AAATTCTCTT 1080 

TTTTTTCTTC 1140 

TCCTTTTCTT 1200 

TCTTATAGCG 1260 

ATCTCAGATA 132 0 

CCCCATTAGT 1380 

GACTCAAAAC 1440 

AAACAGGCAG 1500 

CTACTTTCAG 1560 

ATGTGCTGAG 1620 

TTGGGGAGAA 1680 

CAGAATTCTA 1740 
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TGGAGAAGAG TCTGGCATTT CCTCAAAATG TTAACCTGGA TTTACCATAT GACCCAGCGA 1800 

TTTCATTCAT AGGTTTATAC TCAAAAGAAA TGAAGAAATA TGCCATGCAA AAAAATGTAC 1860 

ATGAAAGGTC ACAACATCAT TATTCATAAT AGTAAAAGGA TGGAAACAAC ACAAATGTCC 1920 

AT CAACTTAT GATTAAAGAA AATCTGGTCT AT T C AT AG AA TGGAATATTA TTCGACCACA 1980 

AAAAGGAATG ATGTACTGAT CCATGCAATG ATGTGGACAA ACCATGAAAA TAACACTAGA 2 040 

TTAAAGAAGC CAGTCACAAA AGGACTTACT GTATGATTCC ATTTACCTGA AATGTTTGGA 2100 

ATAGGCAAAT CCATAGAAAC AGGAGGTAGA TTCCTGGTTT CCAGGGTCTC CAGGAAGGGA 2160 

AGAATGAAGT ACAAGATTTC TTTTGGAGGT AGTGAAATTG TTGTGGAATG AGATCATGAT 222 0 

GATGATAGCA CAACTTTGTG AATATAATAA AATCATTGAA TTGTACAGTT GAATTTATGG 2280 

TATATAAATT ATATGTTAAT AAAAAGGGGG TCCACAAAAC AAACAGCCCC CCACTCTGGT 2340 

TGTCAGGGAG ATATTGGATT AAATGGCCTT GGACAACAAC CCCTCTCCCT GGCCACAGAC 2400 

AT T CT T C AG A TTACAAGATA TTCCAGGGGA AACACTGGAA TGAGTCTGAA GCCAGGTGCT 2460 

AAACAGAAGG ACCATTGAGA AATGTTGTGA TCCTGACAGG TCAAGCAATT TATTTTTCGG 252 0 

CTTCATTTTT AAATGTAAAA TTAGAAAGCT GCCATTTAAA ATGGCCCGTC TGTTTCAATT 2580 

GCTCTTCTCA GTGTCAGCCT GTTAACTCAA TGTGTTAGTC TGTTTTCATG CTGCTGATAA 2640 

AAACATACCT GAGACTGGCA AGAAAAAGAG GTTTAATTGG GCTTAGAGTT CCACGTGATT 2700 

GGGGAGGCCT CAGAATCACA GTAGGAGGCA AAAGTTATTC TTACATGGTG GCTGCAAGAG 2 760 

AAGATGAGGA AGAAGCAAAA GAAGAAACCC CTGATAAACC CATCGGATCT CCTGAGGCTT 2 820 

ATTAACTATC ATGAGAATAG CACAAGAAAG ACCGGCCCCC ATGATTCAAT TACCTCTACC 2880 

TGGGTCCCTC CAATAACATG TGGAAATTCT GGTAGATACA ATT C AAGTTG AGATTTGGGT 2 940 

GGGAACACAG CCAAACCATA TCACTCAGCA AGGCAGATAA CTTTCTCACT GAG CCT ATGC 30 00 

AACAGAAAAC CATCTGGGAT GGTTGTAAGG GGCACAGGAA GTGACTGGTA GGATCACTGC 30 60 

CAAAGCTGAG CACTCAGGAG AAGGCAATAG AAT CCTATT C TCCATAGTAT G CT ATAAGAT 312 0 

ACTGAAGTAC ACTTCTTCAC TATCT CTTTG GACTTAGAAT TAGCACTACA TTCCTTGTTA 3180 

TACAGAAAAA TTACTAAGGA AATTCATAGG ATGACAAAAA CTTTCAGAAC TGAAAAACAG 3240 

GAAATGTAAG CTTTTTAGTT CTTTGGTATT CGAAGTATGC CTAAAAGACA ATGCAAAATC 3 3 00 

CAAGAAAAGA ATGGTGGGGT TTTTGTTTGT TTGGTTTTGT TTTTGTTTTA CAG CTGGAGT 3360 

AGAATACAAA GGGATGGAGT TGAAACAAAT GAGAGGAAAT TGGAATTCTA AACTTATTCT 3420 

CATTGGCATT AGAAAGGCAC CTACATGTAT TTCACATGAG CCGGTGACTG CTGACTTGCA 3480 

TTCTTATTTT TTCCCTATAG ATTAAAAAGG AGGTACAATG GTAGAACTGT AATCCTGTCC 3540 

TTTGTCATAA ATTTTCATAT TCATAAAGGT GAGTGTTAGC CCGCTTGTGA AATCTGAAGT 3600 

TGAGTAACTT CAAATACTAA CCACAGAGGG AAAGGCAGCA AGAGGAGAGG CATAAATTTA 3660 

GGATCTCACC CTTCATTCCA CAGACACACA CAGCCTCTCT GCCCACCTCT GCTTCCTCTA 372 0 

GGAACACAGG TAAGAGCTTC AAGCCTCTCC AGCTTAATAA CATGAATTAT TTTTGAGAAT 3780 

AATAATGATA CTGTGTTCTA TAT C ATGCAT CTCCTGCATT CTGTCTGATT ATATTTTACT 3840 

TATTCTGCCA GAGCAAAATT AAAATACCTA TTTCATCTGA TTTGTCCTTT AT CTAAATTG 3900 

CTTAGTTCCA AGTAAACCAA GGCACTTTTA GGAACACAGA GGGAGAGTGC CTTGCAGCCA 3 960 

GAGAGTCTTG AAGGAGATGT CAGGGACGCA TCTTAACAGC TGGTTGGATG TGATCCACAG 402 0 

AGGTCTCCTG TTAGCATTCA TTGTAAAGCC ATCCTACCTA GCTCTAGTGT AACCAGCAAT 40 80 

GAAAGAAAGA TAAAGAGGGT CGATTACTTA TTTACAATAG TCTTTAAAAA CGTAGTTTTG 4140 

TAAGCCTTCT AATTAGGACA TTAATATATT TAATATATGC ACATTGTAGA AAGATTGAAG 4200 

CGTTAAAAAT AAGAGAAAAA CTTTAAATGT CAAAATCTCA CAACCCAGAT ATATCATTTC 4260 

TTTAAGAAAA TTGTACTACA AAATACCATT CCATTTATTA AAGTCATTCT GACAGGAATC 432 0 

TGATGCTTTT CCAGGAGTTC CAGATCACAT CGAGTTCACC ATGAAT TCAC TCAGTGAAGC 4380 

CAACACCAAG TTCATGTTCG ATCTGTTCCA ACAGTT CAGA AAATCAAAAG AGAACAACAT 4440 

CTTCTATTCC CCTATCAGCA TCACATCAGC ATTAGGGATG GTCCTCTTAG GAGCCAAAGA 4500 

CAACACTGCA CAACAAATTA GCAAGGTAGC TATCAGCATC ATTACGTTGT CCTGTTGCAG 4560 

TTTTTCTCTG GTTCCGTCGG CTAGCACGCA GATGGTAATA GATGTGGTGG TCTGATGGGT 4620 

AGCACAGGGG GCTGTGCAGG AATTCCCATA ACTGTGAGAC CACTGACTTA AACAGATCTT 4680 

TTGAGTAAAG TTTTCTTGTC CCGCTTCATG TCTCTTCCAG GTTCTTCACT TTGATCAAGT 4740 

CACAGAGAAC ACCACAGAAA AAGCTGCAAC AT AT CATGTG AGTCACAGAG CACTCTGATT 4800 

CAGCTTTAGA TCCCTGAACA GGT CATAGTT TAAACCTGGA ACTTCACAAA AACTAAGAAA 4860 

AGGCCAGTTT TAGGGAAAAT CTTGGACACA AAGATTGAGA CATACAGAGT GGGTTGGCAT 4920 

TTCATGGCAC ATAATTATTA TTCCTCATTT CTGCGTTACT AAAAGACAGT CAGCACTGTA 4980 

CCTCAGAGCA T AGGT CTGGA TCAGGATAGG CTGGGTTCAG ACTCCAGCTT TGCTCTTCAC 5040 

AAATGATGAA TAAGAGCAGG ACACAACTGC TCGGAGTCCC AGTGACCTCA TCCCAGAAAA 5100 

CTAAGGGTAA GAAAAAATCT GACTCAATAC ATGCAAATAC ATGCAAATGT TTACAACAGT 5160 

GCCTTGCCCA T AAAAGT CAT AATAAATGTT ATTATTATTA TAAAGTAGCT ATAATTATAC 522 0 

T AAT CAT AAT AATGTGAAAA TAATTTAATT TTCATTGAGT CATTAATGAG AT TCAG AGGA 5280 

ATAAGCACAA GTCCAAGTAT ATTTTGGAAA ATGATTGCTA TGGAATATAT TGGTTTAGAG 534 0 

CCTTAATAGT GCAAAATGCT TTGCTGGAAG GTAGAAAGTT CTAGATTTAA ACAGGCTTAG 5400 

GTTCAAAACT TGGCACTTCT AATTTATGTC TCTATAAACA GGGTTTTTTT CCCCATTCTC 5460 

TGAGCTTTCT TGTGTTCATC TGAATTGAAC TAAAGACTTA GAGTTACCCA TGTAAAGTCC 5520 

TTAGCCATGG ACCTGGCATA CACTCTTCTT ACGTGCAGAG AATGACCATC ATGAGGAAAG 5580 

AGCCACAGAT CAGT CAATGT GTCCTACAAG ATAATAGCAC CAACAGGTAT AACAGGGCTT 5640 

CCTGGCATAA TCTATTTAAA ATATCCAACC TTCAACATAC TCGTATCCTT GATGACTGTT 5700 

AGAAGTGAAA TATGGTCCTT GCCCATAAGG AGCTGAGAGT TTAACTGGGA AGCTAAACCT 5760 

AACCCTTTAA ACCAACAAGG AGAAAATCTA CTGGTAGACA GCGCTGCATC TTTAGTT CAG 5820 

AAGAGAAAAG ATTGCAGTAC GTTAGAGCAA GAAGAATTTT CTGGAAGAAG TCAAATATAA 5880 

GGTGGATTTT GAAGGGTATT TGAGGTGAAA TACACCAATT ATCAGGGAAT AACATCAAAG 5940 

GTCCTCAATG AGACTACCAG CATT TAGGG A CTGATCTAAC AGACTTAGCA TGGGTTTAGT 6000 

ATTTACATTG ATACAGCAAT TGAATGAT CT CCTTTTTTGA TGTTTGAAGG TTGATAGGTC 6060 

AGGAAATGTT CATCACCAGT TTCAAAAGCT TCTGACTGAA TTCAACAAAT CCACTGATGC 6120 

ATATGAGCTG AAGAT CGCCA ACAAGCTCTT CGGAGAAAAG ACGTATCAAT TTTTACAGGT 6180 

AATTTCACCT GGCCTACCCA CATTTCATTT GCATCCTGAT GTCTGTGTCT CTGAGTGGCC 6240 

AAATGGAAGA AAGCAAGGCA GATGAGCCTG GCCGACCCAG GTGGAGAGCA TTTACTCAGA 63 00 

GTGCATTAGC TCCATTTCCA CAACTCTCCC CCACTGGAGT GTCCCAGACC CCAACGATAC 63 60 

ATCACTGAAG TGTGGATTTA GGGATAATCT TGTGATAAAA GAGGAGGTTG TGTAATAGAG 6420 

TGAGTAAGAG TAATAAGTAA TAAGATACCA TCGATAAACT GGCACTGACT CAGT CA CAT A 6480 

CGATACATCT TGGTGGGAAA TGTATGACTA ATGGGATATT ATTGGAATGG GCAGGCTTGG 6540 

GTGAGTTCCT GAGAATAGTT GAGGAAGTAC CAGGAAATAT TGAATGCACA GGATGAAAGA 6600 

CAAAAACAAA GATCAGAAAC ATCATGGTTA AAATTACTGG AGAGAAGTCT GAGAAGCAAT 6660 

GAATCTCCTT CAGGGAAGCC TGCTCTGCAG TTTGCAAACC ACAGCCTCTT CTGCTTCTGC 6720 

CTTTTGCCAA GATGATATTG ACCTTCAGTG ACCTCTTTCT TGTGCCAGCC CACATTCCCC 6780 

TTTTGCATTG C CT A CATGAC ACCTGTATAA AAATATCCAT GGACAGGAGA TACTGCATCT 6840 

ATTCAGGGTC TGGATTCAGC TTACTGTTGT TACAAATAAG TAAGTTTGGT AATATATAGT 6900 

TACATAAATT ACTCCTAATT CCTACTTCTT CCTTCATATC TCAAAGGAAT ATTTAGATGC 6 960 
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CAT CAAG AAA TTTTACCAGA CCAGTGTGGA ATCTACTGAT TTTGCAAATG CTCCAGAAGA 702 0" 
AAGT CGAAAG AAGATTAACT CCTGGGTGGA AAGT CAAACG AATGGTAGGA GAGCCACCCA 70 80 
TTATAGAAAC ACCTTTGAGA AACCTATGCC AGTGAGCCTT GTGCTTGACA CTGCATGGGG 7140 
GAACAGGTGT GGGGATTGAG ATGGGTTTGC AGGGAGGGCT GAAGAGGGCA CTCCAGATGA 7200 
AGGATTTGTC CAAATGAATA TGAAGAGAGC CTAGGGGAGC CAAGGAGGAA AT CACAGGAA 7260 
GCCAATTAGA TGGAAACACA TCTGGAGAAT TATTTGCTTA TGGCCCTGCA TGACAATAGC 7320 
TTTGTGGATC CCCTGTCTCC GCTCAGACCT ATTTTGAGAT CATAT CCTTT ACTTTAAATC 73 80 
AGACTCAAAT TTTTATGATG AATATTTAAT AGAAAACATT AGAAAGCGTC TCTCGTCTCC 7440 
TTTACTAATT GGGAAACAAG CAGCTCTCTG GTAAATCACC CTTTTGTCTC TGAGCTGGAG 7500 
CTGCCTGGAT CACATCTGTA GCCAATGTGT TCTGCAGGGA TTATCACAGC TCTCTTCCCC 7560 
AT CAAGGGCA AAGAGCTTGA CAAAGTCTCC ATTCTACAGA CATCTTTCTT ACCTCCCACC 762 0 
TCTCATTACA GGCCAAACTT ACAGCAACTC AACATGAGAG TGAATAGGAA GATACCCCCG 7680 
GAAGTAGTGT CTGACAGCAC AGGACATGCG TTTCATATTA CAGAGCTCAA GTCACTCATC 7740 
CTAAAATGCA ATCAGGGCCT CCTTCCTCTG AATGGGGACC CCGTAGTTAA AAAAAAATAA 7800 
AAGTAGGAAG AGGAGGGAGG GAGAAAGGAA AGACACATGT TGGAAGAGTA GACAAAATCA 7860 
GTTTATCAGT ATTCCAAATC AGATGATTGG AGACATTCAT ACACAGAGAA CGTGAACTCC 792 0 
TTCTCTATCA CAAGAAGTGA TGTCTCCATC AAGGGTAACT TTATACGACT GGAGCCTTGA 7980 
AGAAAGCTGC AT CTGGTGAA CCACTGGTCA GTGAGTCTAA CAATTCAAAG ATCAAAGTCA 8040 
GTGAGTCTCA AGCAGGGATT TGGGTCAATA ATTAACGATC AGT CACGAAC ATTTGCAAAG 8100 
CATCTTCCAG ACAAGCCATT TGTAGCTTGT GTAAAAGACT CTTTTATTCT TTCCCTTGCA 8160 
GAAAAAATTA AAAACCTATT TCCTGATGGG ACTATTGGCA ATGATACGAC ACTGGTTCTT 8220 
GTGAACGCAA TCTATTTCAA AGGGCAGTGG GAGAATAAAT TTAAAAAAGA AAACACTAAA 8280 
GAGGAAAAAT TTTGGCCAAA CAAGGTATTG TCTATATTTT ATTTATATAG TGTAATATGT 8340 
TAATACATGG AATGTTAAAC ATTTCTGATG GAATGTAACA TGATAAGTAA AAAATAAAAA 840 0 
TTGTTCATGT CTGTTATTTT GTTGTTTTAC TCTTATAACT T TAT T T AGT T AGGAATACCT 8460 
GAAAAACTAT TGTTTCTAAC TCATGGAATT CCTGGGTTAT TTCTTAGAAG AAGAAGGATG 852 0 
TGTTGCTATC TCAATAATAT TATCTTTTTT GTCTTGTGTT TCACGTGTTA TTTGTTGGAC 8580 
ACATTGATTT ATTGCAGAAT ACATACAAAT CTGTACAGAT GATGAGGCAA TACAATTCCT 864 0 
TTAATTTTGC CTTGCTGGAG GATGTACAGG CCAAGGTCCT GGAAATACCA TACAAAGGCA 8700 
AAGATCTAAG CATGATTGTG CTGCTGCCAA ATGAAATCGA TGGTCTGCAG AAGGTAAGAA 87 60 
CTTGCAT CTA CAACTCTTCC TTCTACTGCC GGACATTTTT C CAAAG AT AC C AAGT T T AAA 8820 
CAAGGTAAAA GCTTATGACC GAGTTGCCTC AAAATGATGA AAAATTCTAA ATGAGGAATG 8880 
ATGACTCACC TTCATATTAC AAATATTTGA GCATAGGGCC TGACACAAAC TGAAAGCTTA 8 940 
GTTTTTGTTT GTTTGTTTGT TTTTATTATT ATTATTATAA TACTTTAAGC TTTAGGGTAC 90 00 
ATGTGCACAA TGTGCAGGTT AGTTACATAT GTATACATGT GCCATGCTGG TGTGCTGCAC 90 60 
CCATTAACTC ATCATTTAGC GTTAGGTATA TCTCCTAATG CTATCCCTCC CCCCTCCCCC 912 0 
CACCCCACAA CAGTCCTCAG AGTGTGATGT TACCTTCCTG TGTCCAAGTG TTCTCATTGT 9180 
TCAATTCCCA TCTATGATTT AATTCCATCT ATGGCTTAGT TAATGATTAA TTTATTAGAG 9240 
TTACATGCAT TGGATAT CAA TTTGATGATA TTATTATGCA GCAATTTAAA CTTGACTGGG 93 00 
AGAAATATAT ACCAATGTGA GGAAAGTTTA CAAATAGGCC GAGTAGAAAA GGGAATACAA 93 60 
ATTTAGGAAT TTAGGGAATT ACAATTTAAT AATTGCAATG TGTACTAAAT AATGTATACA 9420 
GAAAAATATG ATGAGCCTAT TAAAAATTGA CACATGTAGT AGGCTGTTGG CACAAGAAAT 9480 
AGTGATACAT ACAGTTCATT GTGTACAAAA TAATGTAATC ATATTTTACA TGTGTATCAT 9540 
ACAGTTGTAT ACATACATAT GTACACATAT ACATATACGT AAAAACATGA TTCTGTTTTT 9600 
ACATACATGT ATATACATAT ACACATATAA CCCAATGTAT TTATATATTC AGGACTCATA 9660 
TTTTACCTAT TAGAATAATA ATGTCTATTA AAGTGAACCT TCTGTATTTC ACATTTATTG 9720 
CCAAAATAAC GAATCTCCAC ATAGTCAATT CATTGTTAAG GTGTATTAGA GATCGACAGT 9780 
T AGT CATAT C AGTTTCTTTT TTCCATTTGT ATAGCTTGAA GAGAAACTCA CTGCTGAGAA 9840 
ATTGATGGAA TGGACAAGTT TGCAGAATAT GAGAGAGACA TGTGTCGATT TACACTTACC 9900 
TCGGTT CAAA ATGGAAGAGA GCTATGACCT CAAGGACACG TTGAGAACCA TGGGAATGGT 9960 
GAATATCTTC AATGGGGATG CAGACCTCTC AGGCATGACC TGGAGCCACG GTCTCTCAGT 10 02 0 
AT CTAAAGT C CTACACAAGG CCTTTGTGGA GGTCACTGAG GAGGGAGTGG AAGCTGCAGC 10 080 
TGCCACCGCT GTAGTAGTAG TCGAATTATC ATCTCCTTCA ACTAATGAAG AGTTCTGTTG 10140 
TAATCACCCT TTCCTATTCT T CAT AAGGCA AAATAAGACC AACAGCATCC TCTTCTATGG 10200 
CAGATTCTCA TCCCCATAGA TGCAATTAGT CTGTCACTCC ATTTAGAAAA TGTTCACCTA 10260 
GAGGTGTTCT GGTAAACTGA TTGCTGGCAA CAACAGATTC TCTTGGCTCA TATTTCTTTT 10320 
CTATCTCATC TTGATGATGA TAGTCATCAT CAAGAATTTA ATGATTAAAA TAGCATGCCT 10380 
TTCTCTCTTT CTCTTAATAA GCCCACATAT AAATGTACTT TTCCTTCCAG AAAAATTTCC 10440 
CTTGAGGAAA AATGTCCAAG ATAAGATGAA TCATTTAATA CCGTGTCTTC TAAATTTGAA 10500 
ATATAATTCT GTTTCTGACC TGTTTTAAAT GAACCAAACC AAATCATACT TTCTCTTCAA 10560 
ATTTAGCAAC CTAGAAACAC ACATTTCTTT GAATTTAGGT GATACCTAAA TCCTTCTTAT 10620 
GTTTCTAAAT TTTGTGATTC TATAAAACAC AT CAT CAAT A AAATAATGAC ATAAAATCAT 10680 
TTTTGCTTTA CCTGTTTTCT CTCTGGAAAG GGCAAGTGTC CAGTTACACA TAGGAAAGAT 10740 
AATTTAGAGA TATATTAATC ATATATAAAG GAAAATTAAA AACAGAGTAG TTCATGATGA 10 80 0 
GCCTGGAGTA GAAGGCATAT CCCAGAACAG GAGGAGCCTT GTAAACCACA TAGGAACTTC 10860 
CTATTTTATG CTAAAGGGAT AAGAAACTCA TTACAGGCTT TGATGGTTGT TTGTCAAAGA 10 920 
GGGGCATAAA ATTATCATAT CCACATCTAG AAAATACATC TCTGGCTACG CTGATATCAA 10980 
TGGATGCGAG GAAAGAACAG TGTGGTTACC ATATATAAAT TAGGAAATCA TTAGAGTATT 11040 
GGGAGTGGAA ATGGAGAGAA AGAAAGAGCC TGGGGGAATT ATTTAGGAAA TAATAGTTAC 11100 
AGAAAGACAT CTAAGTTGCT GACCTATCTG ACTGGATGGA TGGAAGAATA TCTTGTTTCT 11160 
GAGAGAAAAA AAGACTTTGG GTTTAAATTT GTACTTGATG AATTAAGGTA CTTTTAATAT 11220 
TCAAATGGAT TTGCCTGGCA GGCACTTGAA GATATTAGTC TAAATCTCAG AAACAGAATA 11280 
TGATCTGAAG CTCTAAATTT GTGATATTCA ATATAAATAC TTTAGAGTCA TTGGGATAAA 11340 
TATGGTAGTT GTAGCTAAAA GCAAAAATAA GATACTAGGG AGAAAGGATA AAGTTAGAAG 11400 
AAAGAAGAAT CTAGAATTGA CCTTGAAGTA TATCAG CATG TGTAAAGATC AGGAATTGAT 11460 
CATTTTTATT TTCCAGAAAG TAGCTTTTCT TAGGGTTCCA TATTTACTCC CATAGATTCT 11520 
TCCC 

Seq ID NO: 465 Protein sequence 
Protein Accession #: BAB21525.1 

1 11 21 31 41 51 

l I l I I I 

MNSLSEANTK FMFDLFQQFR KSKENNIFYS PISITSALGM VIiLGAKDNTA QQISKVLHFD 60 

QVTENTTEKA ATYHVDRSGN VHHQFQKLLT EFNKSTDAYE LKIANKLFGE KTYQFLQEYIj 120 

DAIKKFYQTS VES TDFANAP EESRKKINSW VESQTNEKIK NLFPDGTIGN DTTLVLVNAI 180 

YFKGQWENKF KKENTKEEKF WPNKNTYKSV QMMRQYNSFN FALLEDVQAK VLEIPYKGKD 240 
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LSMIVLLPNE IDGLQKLEEK LTAEKLMEWT SLQNMRETCV DLHLPRFKME ESYDLKDTLR 
TMGMVN I FNG DADLSGMTWS HGLSVSKVLH KAFVEVTEEG VEAAAATAW WELSSPSTN 
EEFCCNHPFL FFIRQNKTNS ILFYGRFSSP 
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Seq ID NO: 466 DNA sequence 

Nucleic Acid Accession #: NM_001910.1

Coding sequence: 50..1240



10 



15 



20 



25 



30 



35 



40 



45 



GGAGAGAAGA 
CCTTCTTTTG 
GCCCCTCAGG 
GTTCTGGAAA 
GAGTGCCAAG 
TGGCTCCCCA 
CCCCTCTGTG 
GTCCAGCACA 
GTCCGGGATC 
GTTTGGAGAA 
TCTGGGCCTG 
GATGGCTCAG 
AGGTGGTGCG 
CCTGAATTGG 
GGTGGGAGGC 
TTCCCTCATC 
CCCCGTGGAT 
CTTCACCATT 
CGTGGATGGA 
TGGGCCCCTC 
TGGGAATAAC 
CCTGCCTGTC 
GTTATTTTCC 
ACATGAGAAT 
ACTCCCACCA 
TGATTATGAA 
GCAGAGATCA 
CACACGGCCA 
GTACCTGGAT 
TAACATCCTT 
CTGTTTTTGT 
TTTGAAATGT 
TTGAAATCCC 
AGTTAGATCT 
CTTGTTGCAT 
CTGCTGGGTG 



11 

I 

AAGGAGGGGG 
CTGCTGGTGC 
AGGCATCCGT 
TCCCATAATT 
GAACCCCTCA 
CCACAGAACT 
TACTGCACTA 
TACAGCCAGC 
ATTGGAGCCG 
AGTGTCACAG 
GGATACCCCT 
AACCTGGTGG 
GGGAGCGAGC 
GTCCCAGTCA 
ACTGTTATGT 
ACTGGCCCTT 
GGAGAATATG 
AACGGAGTCC 
ATGCAGTTCT 
TGGATCCTGG 
CGTGTGGGAC 
TGACAGACCT 
AGAGAATGTA 
ACACACACAC 
CCGTCATGAT 
AATCAAAAAT 
TGGTATAATA 
GGCCTGTTTA 
CATTCTGAAG 
AAATATACAA 
AGTTGGATTG 
CTGTAAGTCT 
GAGGTGTCAT 
GGAGGTCTGA 
CCTGTCAGGA 
GGTTTGGAGT 



21 



CAAGGGAGAA 
TCCTGGAGCT 
CCCTCAAGAA 
TGGACATGAT 
TCAACTACTT 
TCACTGT CAT 
GCCCAGCCTG 
CAGGTCAATC 
ACCAAGTCTC 
AGCCAGGCCA 
CCTTGGCTGT 
ACTTGCCGAT 
TGATTTTTGG 

ccaagcaagc 
tctgctccga 
ccgacaagat 
ctgtggagtg 
cctat'accct 
gcagcagtgg 
gggatgtctt 
tggccccagc 

TGAATATGTT 
GCTGTTTCCA 
ACACACATAT 
GGAGGAATTA 
TTTCACATTT 
AATCCCTTTG 
TCTACACTGC 
CAAATT CCGA 
TCGGAATTCA 
TTTGTATTAG 
CTTTCCATCT 
TTGACATGGT 
TTTTGTGGCA 
GGCAGATAAT 
TCTTGGCTTT 



31 
I 

GCTGCTGGTC 
GGGAGAGGCC 
GAAGCTGCGG 
CCAGTTCACC 
GGATATGGAA 
CTTCGACACT 
CAAGACGCAC 
TTTCTCCATT 
TGTGGAAGGA 
GACCTTTGTG 
GGGAGGAGTG 
GTTTTCTGTC 
AGGCTACGAC 
TTACTGGCAG 
GGGCTGCCAG 
TAAGCAGCTG 
TGCCAACCTT 
CAGCCCAACT 
CTTTCAAGGA 
CAT TCGACAG 
AGTCCCCTAA 
AGGCTGGGGC 
GGGTTGCAAC 
ACACACACAC 
CGTTATACAT 
GATTATGAAA 
CAACTCCACT 
TGCCCACTCC 
GCATTACATC 
AGCATCTCCC 
G ATT CAAGCA 
ACAGAGTTTA 
TCTCTGAACT 
AAAATACTTC 
GCTGGTGCCT 
AATCATTCAT 



41 
I 

GG ACT CACAA 
CAAGGATCCC 
GCACGGAGCC 
GAGTCCTGCT 
TACTTCGGCA 
GGCTCCTCCA 
AGCAGGTTCC 
CAGTATGGAA 
CTAACCGTGG 
GATGCAGAGT 
ACTCCAGTAT 
TACATGAGCA 
CACTCCCATT 
ATTGCACTGG 
GCCATTGTGG 
CAAAACGCCA 
AACGTCATGC 
GCCTACACCC 
CTTGACATCC 
TTTTACTCAG 
GGAGGGGCCT 
ATTCTTTACA 
TTGAATTAAG 
ACACTTCACA 
TCATATTTTG 
ATCTCCAAAC 
CAGCCCTGAC 
TCTCTCCAGC 
ATTTTGTCCA 
ATTGTCCCAC 
AGGCCCATAT 
GCACATT TGA 
TATCTTTCCT 
CTAGGTGGTG 
CTCTATTGGT 
TACAAAGTTC 



51 



TGAAAACGCT 60 

TTCACAGGGT 120 

AGCTCTCTGA 180 

CAATGGACCA 240 

CTATCTCCAT 300 

ACCTCTGGGT 360 

AGCCTTCCCA 42 0 

CCGGGAGCTT 480 

TTGGCCAGCA 540 

TTGATGGAAT 600 

TTGACAACAT 660 

GTAACCCAGA 72 0 

TCTCTGGGAG 780 

ATAACATCCA 840 

ACACAGGGAC 900 

TTGGGGCAGC 960 

CGGATGTCAC 102 0 

TACTGGACTT 1080 

ACCCTCCAGC 1140 

TCTTTGACCG 1200 

TGTGTCTGTG 12 60 

CCTACAAAAA 132 0 

ACCAAACAGA 13 80 

CATACACACC 1440 

TATTGATTTT 1500 

ATATGCACAA 1560 

AACCCATCCA 162 0 

TCCACATGCT 1680 

TAAATATTTC 1740 

AAATGTTTGG 1800 

ATTGCATTTA 1860 

ACGTTGCTGG 1920 

ATAAAATGGT 1980 

CTGGGTACTT 2040 

AATGTTAAGA 2100 
AGCATTTT 



50 



Seq ID NO: 467 Protein sequence 
Protein Accession #: NP_001901.1



55 



60 



65 



70 



75 



80 



85 



11 



MKTLLLLLLV 
SMDQSAKEPL 
QPSQSSTYSQ 
FDGILGLGYP 
FSGSLNWVPV 
I G AAPVDGE Y 
HPPAGPLWII* 



LLELGEAQGS 
INYLDMEYFG 
PGQSFSIQYG 
SLAVGGVTPV 
TKQAYWQIAL 
AVE C ANLNVM 
GDVFIRQFYS 



21 
I 

LHRVPLRRHP 
TISIGSPPQN 
TGSLSGIIGA 
FDNMMAQNLV 
DNIQVGGTVM 
PDVTFTINGV 
VFDRGNNRVG 



31 



41 



SLKKKLRARS 
FTVIFDTGSS 
DQVSVEGLTV 
DLPMFSVYMS 
FCSEGCQAIV 
PYTLSPTAYT 
LAPAVP 



QLSEFWKSHN 
NLWVPSVYCT 
VGQQFGESVT 
SNPEGGAGSE 
DTGTSLITGP 
LLDFVDGMQF 



51 
I 

LDMIQFTESC 
SPACKTHSRF 
EPGQTFVDAE 
LIFGGYDHSH 
SDKIKQLQNA 
CSSGFQGLDI 



Seq ID NO: 468 DNA sequence 

Nucleic Acid Accession #: NM_018058.1 

Coding sequence: 319..1575



11 



TACGCGCTGC 
GACGGCCGGG 
TACACCGACA 
GTCAACGTGG 
AGAAAGGGCT 
CCTGATGCCC 
CTCAGAGATG 
GTGGGCCCCA 
AACTTCCTTT 
GTGGACGACC 
AAAGTGGACA 
ACCCATGGGA 
GTCCGCACGG 
AACATTGCCT 
GGAGACCCCC 
ACAGGGGGTG 
GGAGAGT CCA 
TGGCTGCGAG 
CTCTACACCA 
TGTGAGATGG 
GTGACGTGGC 



GGGACCGGCA 
AGGAGAT CTA 
AGTTGTTCAA 
CCCGTGGTGT 
CTGGACGCTA 
TCATTGAAAT 
TGGCTGCTGA 
TCCTCAGCAG 
TCCACAACCG 
CCCACCAGCA 
TCGTCTATGG 
AGGTCCGCTT 
TCATCACCGC 
ACCGCAGCTC 
TCATCGAGGA 
TGGTGACCGA 
TGGCTCAGCC 
TGGTGCCACG 
AGAAGAGTGG 
AGCCCGTGGC 
CAGATGGCAA 



21 
I 

GGGGAACGCC 
CTTCCTCAAC 
GTTCCGCAAT 
GGCCAGCCTC 
CTCTATCTAC 
GGACCCTGAG 
GGCTGGGGTC 
CAGTGCCTCG 
GGGCGATGGC 
TGGGCGAGGT 
CAACTGGAAT 
CCGGGACATC 
CGACTTTGAC 
CTCAGCCAAC 
GCTCAATCCC 
CTTCGACGGA 
GCTGTCCGTC 
CACCCGGGTT 
GGCCCACCTG 
ACACTTTGGC 
GATGGTGAGC 



31 

i 

ATCGGGGTCA 
ACCAATAATG 
AACCGGTGGG 
TTTGCCGGAC 
ATTGCCAATT 
GCCAGTGACC 
AGCAAATATA 
GATATCTTCT 
ACCTTTGTGG 
GTCGCCCTGG 
GGCCCCCACC 
GCCTCACCCA 
AATGACCAGG 
CGCCTCTTCC 
GGCGACGCCT 
GACGGGATGC 
TTCCGGGGCA 
GGGGCCTTTG 
AGGATCATCG 
CTGGGGAAGG 
CGGAACGTGG 



41 



CAGCCTGCGA 
CCTTCTCGGG 
AAGACATCCT 
GCTCTGTGGC 
ACGCCTACGG 
TCTCCCGGGG 
CAGGGGGCCG 
GCGACAATGA 
ACGCTGCGGC 
CTGACTTCAA 
GCCTCTATCT 
AGTTCTCCAT 
AGCTGGAGAT 
GCGTCATCCG 
TGGAGCCTGA 
TGGACCTCAT 
ATCAGGGCTT 
CCAGGGGAGC 
ACGGGGGCTC 
ATGAAG CCAG 
CCAGCGGGGA 



51 
I 

CATCGACGGG 
GGTGGCCACG 
GAGCGATGAG 
CTGTGTGGAC 
TAATGTGGGC 
CATTCTGGCG 
AGGCGTCAGC 
GAATGGGCCT 
CAGTGCTGGT 
CCGTGATGGC 
GCAAATGAGC 
GCCCTCCCCT 
CTTCTTCAAC 
TAGAGAGCAC 
GGGCCGGGGC 
CTTGTCCCAT 
CAACAACAAC 
TAAGGTCGTG 
AGGCTACCTG 
CAGTGTGGAG 
GATGAACTCA 



60 
120 
180 
240 
300 
360 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
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GTGCTGGAGA TCCTCTACCC 
ACACCAATGA ATGCATCCAG 
ACACCTATGG AAGCTACAGG 
ACGAGGATGG CACAGCCTGC 
CCCCCACCGC TGCTGCTGCC 
CACCGGTCCT CGTAGATGGA 
CCAGCTGCTG AGCAGGGGTG 
AAGTGGGCTT GTGCTGCTGC 
CCCAAGCCCA TCCATGCACA 
CTGTGCTGGG CACATAGCTG 
AT T CCAGTGG GTCTAATGAC 
CTGCACAGGA AGTATGAGGA 
AAAGCTATGT GACCTTACAC 
AAATGGGGAT TAAGAATAGA 
GACACTTGGC ACAAAACCTG 
GGGCTTTGTC AACACGTG 
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CCGGGATGAG 
TTCCCATTCG 
TGCCGGACCA 
GTGGGGACTC 
ACTGCCGCTG 
GATCTCAATC 
GGACATGAAC 
CTAGACAGTA 
TTACTTAGCT 
TGATCACAGC 
CATATCTTAG 
CTTTAGTGTC 
CAGTCACTTA 
ATCTTGGGGT 
GCACATAGTA 



GACACACTTC 
TGTGCCCTCG 
ACAAGAAGTG 
TCGGCCAGTC 
CTGCTGCCGC 
TGGGGTCGGT 
CAGCGGATGG 
GGGATGTAAA 
AACAATTAGG 
AGACAGGGTC 
GACACAGATG 
CTGAGTTCAA 
ACTTGTTAGC 
TAGTGTGGAG 
AAGGCTCAAT 



AGGACCCAGC 
AGACAAGCCC 
CAGTCGGGGC 
ACCGGGCCCC 
TGCTGGAGCT 
GGTTAAGGAG 
AGTCCAGCAG 
GGCCTGGGAG 
GAGACTCGTA 
GCTGCCCTGA 
TGCCCAGGGA 
ATCCTGATTC 
CATCCATTAT 
ATTAGATTAA 
AAAAACAAGT 



CCCACTGGAG 1320 

GTATGTGT CA 13 80 

TACGAGCCCA 1440 

CGCCCCACCA 1500 

GCCACTGCTG 1560 

AGCTGCGAGC 162 0 

GGGAGTGGGA 1680 

CTAGACCCTC 1740 

AGGCCAGGCC 180 0 

TGGCGCTTAC 1860 

GGTGGTGT CA 1920 

AGGAACTCAC 1980 

CGCATCTGCA 2040 

ATGTATGTAA 2100 

GCCTCTCACT 2160 



20 



Seq ID NO: 469 Protein sequence 
Protein Accession #: NP_060528.1
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30 



35 



40 
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55 



60 



65 



70 



75 



80 



MDPEASDLSR 
RGDGT FVDAA 
FRDIASPKFS 
ELNPGDALEP 
RTRVGAFARG 
KMVSRNVASG 
GAGPTRSAVG 



11 

I 

G I LALRD VAA 
ASAGVDDPHQ 
MPSPVRTVIT 
EGRGTGGWT 
AKWLYTKKS 
EMNSVLEILY 
ATSPTRMAQP 



21 
1 

EAGVSKYTGG 
HGRGVALADF 
ADFDNDQELE 
DFDGDGMLDL 
GAHLRI IDGG 
PRDEDTLQDP 
AWGLSASHRA 



31 

1 

RGVSVGPIIiS 
NRDGKVDIVY 
IFFNNIAYRS 
ILSHGESMAQ 
SGYLCEMEPV 
APLETPMNAS 
PAPPPPPLLL 



41 

1 

SSASDIFCDN 
GNWNGPHRLY 
SSANRLFRVI 
PLSVFRGNQG 
AHFGLGKDEA 
SSHSCALETS 
PLPLLLPLLE 



51 

I 

ENGPNFIjFHN 
LQMSTHGKVR 
RREHGDPLIE 
FNNNWLRWP 
SSVEVTWPDG 
PYVSTPMEAT 
LPLLHRSS 



Seq ID NO: 470 DNA sequence 
Nucleic Acid Accession #: AJ279016 
Coding sequence: 1..1962 



1 
I 

ATGT CCAGGA 
CAGCGGGCTG 
AGTAATCCCA 
TTTGAGATCG 
CAGAAGCGGC 
GACCGGCAGG 
GAGATCTACT 
TTGTTCAAGT 
CGTGGTGTGG 
GGACGCTACT 
ATTGAAATGG 
GCTGCTGAGG 
CTCAGCAGCA 
CACAACCGGG 
CACCAGCATG 
GTCTATGGCA 
GTCCGCTTCC 
ATCACCGCCG 
CGCAGCTCCT 
ATCGAGGAGC 
GTGACCGACT 
GCTCAGCCGC 
GTGCCACGCA 
AAGAGTGGGG 
CCCGTGGCAC 
GATGGCAAGA 
CTCTACCCCC 
TTCTCCCAGC 
GTGTGCCCTC 
AACAAGAAGT 
CTCGGCCAGT 
GCTGCTGCCG 
CTGGGGTCGG 
CCAGCGGATG 
AGGGATGTAA 
TAACAATTAG 
CAGACAGGGT 
GGACACAGAT 
CCTGAGTTCA 
AACTTGTTAG 
TTAGTGTGGA 
AAAGGCT CAA 



11 
I 

TGTTACCGTT 
AACCCATGTT 
CCCAGCTCAA 
TCGTGGCGGG 
TGGTGAACAT 
GGAACGCCAT 
TCCTCAACAC 
TCCGCAATAA 
CCAGCCTCTT 
CTATCTACAT 
ACCCTGAGGC 
CTGGGGTCAG 
GTGCCTCGGA 
GCGATGGCAC 
GGCGAGGTGT 
ACTGGAATGG 
GGGACATCGC 
ACTTTGACAA 
CAGCCAACCG 
TCAATCCCGG 
TCGACGGAGA 
TGTCCGTCTT 
CCCGGTTTGG 
CCCACCTGAG 
ACTTTGGCCT 
TGGTGAGCCG 
GGGATGAGGA 
AGGAAAATGG 
GAGACAAGCC 
GCAGTCGGGG 
CACCGGGCCC 
CTGCTGGAGC 
TGGTTAAGGA 
GAGTCCAGCA 
AGGCCTGGGA 
GGAGACTCGT 
CGCTGCCCTG 
GTGCCCAGGG 
AATCCTGATT 
CCATCCATTA 
GATTAGATTA 
TAAAAACAAG 



21 
I 

CCTGCTGCTG 
CACTGCAGTC 
CTATGGTGTG 
GTACAATGGA 
CGCGGTCGAT 
CGGGGTCACA 
CAATAATGCC 
CCGGTGGGAA 
TGCCGGACGC 
TGCCAATTAC 
CAGTGACCTC 
CAAATATACA 
TATCTTCTGC 
CTTTGTGGAC 
CGCCCTGGCT 
CCCCCACCGC 
CTCACCCAAG 
TGACCAGGAG 
CCTCTTCCGC 
CGACGCCTTG 
CGGGATGCTG 
CCGGGG CAAT 
GGCCTTTGCC 
GAT CATCG AC 
GGGGAAGGAT 
GAACGTGGCC 
CACACTTCAG 
CCATTGCATG 
CGTATGTGTC 
CTACGAGCCC 
CCGCCCCACC 
TGCCACTGCT 
GAGCTGCGAG 
GGGGAGTGGG 
GCTAGACCCT 
AAGGCCAGGC 
ATGGCGCTTA 
AGGTGGTGTC 
CAGGAACTCA 
TCGCATCTGC 
AATGTATGTA 
TGCCTCTCAC 



31 
I 

CTCTGGTTTC 
ACCAACTCAG 
GCAGTTACTG 
CCCAACCTGG 
GAGCGCAGCT 
GCCTGCGACA 
TTCTCGGGGG 
GACAT CCTGA 
TCTGTGGCCT 
GCCTACGGTA 
TCCCGGGGCA 
GGGGGCCGAG 
GACAATGAGA 
GCTGCGGCCA 
GACTTCAACC 
CTCTATCTGC 
TTCTCCATGC 
CTGGAGATCT 
GTCATCCGTA 
GAGCCTGAGG 
GACCTCATCT 
CAGGGCTTCA 
AGGGGAGCTA 
GGGGGCTCAG 
GAAGCCAGCA 
AGCGGGGAGA 
GACCCAGCCC 
GACACCAATG 
AACACCTATG 
AACGAGGATG 
ACCCCCACCG 
GCACCGGTCC 
CCCAGCTGCT 
AAAGTGGGCT 
CCCCAAGCCC 
CCTGTGCTGG 
CATTCCAGTG 
ACTGCACAGG 
CAAAGCTATG 
AAAATGGGGA 
AGACACTTGG 
TGGGCTTTGT 



41 



TGCCCATCAC 
TTCTGCCTCC 
ATGTGG AC CA 
TTCTGAAGTA 
CACCCTACTA 
TCGACGGGGA 
TGGCCACGTA 
GCGATGAGGT 
GTGTGGACAG 
ATGTGGGCCC 
TTCTGGCGCT 
GCGT CAGCGT 
ATGGGCCTAA 
GTGCTGGTGT 
GTGATGGCAA 
AAATGAGCAC 
CCTCCCCTGT 
TCTTCAACAA 
GAGAGCACGG 
GCCGGGGCAC 
TGTCCCATGG 
ACAACAACTG 
AGGTCGTGCT 
GCTACCTGTG 
GTGTGGAGGT 
TGAACTCAGT 
CACTGGAGTG 
AATGCATCCA 
GAAGCTACAG 
GCACAGCCTG 
CTGCTGCTGC 
TCGTAGATGG 
GAGCAGGGGT 
TGTGCTGCTG 
ATCCATGCAC 
GCACATAGCT 
GGTCTAATGA 
AAGTATGAGG 
TGACCTTACA 
TTAAGAATAG 
CACAAAACCT 
CAACACG 



51 
I 

TGAGGGGTCC 
TGACTATGAC 
TGATGGGGAC 
TGACCGGGCC 
CGCGCTGCGG 
CGGCCGGGAG 
CACCGACAAG 
CAACGTGGCC 
AAAGGGCTCT 
TGATGCCCTC 
CAGAGATGTG 
GGGCCCCATC 
CTTCCTTTTC 
GGACGACCCC 
AGTGGACATC 
CCATGGGAAG 
CCGCACGGTC 
CATTGCCTAC 
AGACCCCCTC 
AGGGGGTGTG 
AGAGTCCATG 
GCTGCGAGTG 
CTACACCAAG 
TGAGATGGAG 
GACGTGGCCA 
GCTGGAGATC 
TGGCCAAGGA 
GTTCCCATTC 
GTGCCGGACC 
CGTGGGGACT 
CACTGCCGCT 
AGATCTCAAT 
GGGACATGAA 
CCTAGACAGT 
ATTACTTAGC 
GTGATCA CAG 
CCATATCTTA 
ACTTTAGTGT 
CCAGTCACTT 
AATCTTGGGG 
GGCACATAGT 



Seq ID NO: 471 Protein sequence
Protein Accession #: CAC08451 



51 



85 



1 11 21 31 41 

111)11 
MSRMLPFLLL LWFLPITEGS QRAEPMFTAV TNSVLPPDYD SNPTQLNYGV AVTDVDHDGD 

FEIWAGYNG PNLVLKYDRA QKRLVNIAVD ERSSPYYALR DRQGNAIGVT ACDIDGDGRE 

EIYFLNTNNA FSGVATYTDK LFKFRNNRWE DILSDEVNVA RGVASLFAGR SVACVDRKGS 



60 
120 
180 
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GRYSIYIANY AYGNVGPDAL 
LSSSASDIFC DNENGPNFLF 
VYGNWNGPHR LYLQMSTHGK 
RSSSANRLFR VIRREHGDPL 
AQPLSVFRGN QGFNNNWLRV 
PVAHFGLGKD EASSVEVTWP 
FSQQENGHCM DTNECIQFPF 
LGQSPGPRPT TPTAAAATAA 



PCT/US02/12476 



IEMDPEASDL 
HNRGDGTFVD 
VRFRDIASPK 
IEELNPGDAL 
VPRTRFGAFA 
DGKMVSRNVA 
VCPRDKPVCV 
AAAAAGAATA 



SRGILALRDV 
AAASAGVDDP 
FSMPSPVRTV 
EPEGRGTGGV 
RGAKWLYTK 
SGEMNSVLEI 
NTYGSYRCRT 
APVLVDGDLN 



AAEAGVSKYT 
HQHGRGVALA 
ITADFDNDQE 
VTDFDGDGML 
KSGAHLRIID 
LYPRDEDTLQ 
NKKCSRGYEP 
LGSWKESCE 



GGRGVSVGPI 
DFNRDGKVDI 
LEIFFNNIAY 
DLILSHGESM 
GGSGYLCEME 
DPAPLECGQG 
NEDGTACVGT 
PSC 



Seq ID NO: 472 DNA sequence 
Nucleic Acid Accession #: FGENESHH 
Coding sequence: 1..4794 



85 



ATGGCGTGTC 
AGCGGCTCCT 
GTTCTGAAGT 
TCACCCTACT 
ATCGACGGGG 
CACAGCAGCT 
CCACCTACAA 
TCCTCCCTGG 
TGTCGGGGTG 
GGGGTGGCCA 
CTGAGCGATG 
GCCTGTGTGG 
GGTAATGTGG 
GGCATTCTGG 
TTCTCCCACA 
GGAGGAGACC 
TGCCGGCTGG 
CAGAGGGAGG 
TCCAAAAGCC 
GCGCCTTCTC 
CCCCTTGTCA 
CCCCACCCCC 
CTGATGGCTG 
CTGAGAAGCT 
GAGCTGGGAG 
CTGGGAGAAC 
CCCAAGGTCA 
GGCCCCGGGA 
CTCTCCCATC 
GTGCCGGGAG 
CTGGCGTGGA 
TTTAGGCTCA 
CTGCAGTTCC 
TCTGCCACTC 
ATCCTCAGCA 
TTCCACAACC 
GCCTTCATCG 
CTAGCAGAAA 
CCACATTGCC 
TTCTTGACGC 
CAGGGGGCCC 
ACTGCCTATT 
TTGTCCTCTG 
GCCCTGGCTG 
CCCCACCGCC 
TCACCCAAGT 
GACCAGGAGC 
CTCTTCCGAT 
GGTCAGGGAG 
AAGGTCAACA 
AGAGGCTGTG 
AAAGGGAAGG 
CCACACTACC 
GTCCAATCAC 
CGGGGTCCAA 
GCTACGGGCT 
AGGGGCTACG 
AGAAAGGGGC 
CCAGGAAAAG 
ACTACCAGGA 
AATCACTACC 
GTCCAATCAC 
CGGGGTCCAA 
GCTATGGGGT 
AGGGGCTATG 
AGAGAGCACG 
GGCCGGGGCA 
TTGTCCCATG 
AACAACAACT 
AAGGTCGTGC 
GGCTACCTGT 
AGTGTGGAGG 



11 
I 

CGGGAGGACT 
CCCCAGCATC 
ATGACCGGGC 
ACGCGCTGCG 
ACGGCCGGGA 
CAGCGCAGGT 
CCCCTGCAGG 
GTCAGGCTTC 
GACTGAGACC 
CGTACACCGA 
AGGTCAACGT 
ACAGAAAGGG 
GCCCTGATGC 
CGCTCAGAGA 
CTGCCTCTCC 
CAGAGGAGGC 
GCTGGAAGGA 
CTGGGGCAGC 
ATTTGGCTGA 
CAGCCCACCC 
CTCAGCTAAT 
GAGCCCCAGG 
AGGCTTTGGG 
GGGAGGAAAG 
GTCCCTGGAG 
CTCCCATTTT 
CACAGGAGTG 
GGGTGGCCAA 
CCCTGGTCCC 
CTGCCCTGCC 
ACCAGATGGA 
GGAAAGCACG 
CCTCAGGCCT 
ACTGTGGGTC 
GCAGTGCCTC 
GGGGCGATGG 
TTCACCTCAA 
CTGGTCCTTC 
ATCATGGTTT 
AAGGCTTGGC 
CACCCTGCCT 
ACATTGTCCT 
AAAGAGTCAA 
ACTTCAACCG 
TCTATCTGCA 
TCTCCATGCC 
TGGAGATCTT 
GCTCCATCCT 
AAGGTTTAAG 
CAGGTCCCCT 
GGAATGCAGG 
GAAATGTGGC 
ACAAAAAGGG 
TACCAGGAAA 
TCACTACCAG 
CCAATCACTA 
GGCTCCAATC 
TACGGGCTCC 
GGGCTACAGG 
AAAGGGGCTA 
AGGAAAA GGG 
TACCACAGAA 
TCACTACCAG 
CCAATCACTA 
GGGTCCAATC 
GAGACCCCCT 
CAGGGGGTGT 
GAGAGTCCAT 
GGCTGCGAGT 
TCTACACCAA 
GTGAGATGGA 
TGACGTGGCC 



21 
I 

CCCAGCCCGT 
CCCTCCCCAT 
CCAGAAGCGG 
GGACCGGCAG 
GGAGAT CTAC 
CCCTTCTGGG 
CCTCCTGGGT 
TCCGGACAGC 
TACCCATGAA 
CAAGTTGTTC 
GGCCCGTGGT 
CTCTGGACGC 
CCT CATTGAA 
TGTGGCTGCT 
AAGCATTGGT 
AGATGAGGAG 
CGGGCAGTTC 
TGGCGTGCCC 
CAAGAACCTA 
TTTCCCTGCC 
GACACATGGA 
AATGGACCCC 
CGCGTGGCCA 
CAGGCAGAAG 
CCAAGCCACA 
ACAAAGAACA 
CCATCTAGTG 
G CGAGAG ATT 
CAACTTCCCC 
TGGGAAT CCT 
AAAAGAGGAG 
GGAAGCAGAA 
CAGAGGCAGC 
GATGTCTTTT 
GGATATCTTC 
CACCTTTGTG 
AT AT CACCT C 
CTCCTCCTGC 
GTCTATGAGC 
CTCCAGTGCC 
TCTGGCAAGA 
GTGGTCTGCC 
CGTGGGTGTG 
TGATGGCAAA 
AATGAGCACC 
CTCCCCTGTC 
CTTCAACAAC 
GGCTCGTGGC 
AATCAGAAGG 
GATGAAGAAA 
GCAAAGCCTG 
CCAAAGTGTG 
GCTACAGGGT 
AGGGGCTACG 
GAAAAGGGGC 
CCAGGAAAAG 
ACTACCAGGA 
AATCACTACC 
GTCCAATCAC 
CGGGGTCCAA 
GCTACAGGGT 
AGGGGCTACG 
GAAAAGGGGC 
CCAGGAAAAG 
ACTACCACAG 
CATCGAGGAG 
GGTGACCGAC 
GGCTCAGCCG 
GGTGCCACGC 
GAAGAGTGGG 
GCCCGTGGCA 
AGATGGCAAG 



31 
I 

TGCTCTGGTT 
TCCTCCTCCA 
CTGGTGAACA 
GGGAACGCCA 
TTCCTCAACA 
CTCCACAGAA 
CTGCCTCCAC 
AGGCAGGGAG 
CCAGAACCAT 
AAGTTCCGCA 
GTGGCCAGCC 
TACTCTATCT 
ATGGACCCTG 
GAGGCTGGGG 
GAGATATCTG 
CACAGTGGGG 
AAGGAAGAAG 
AGAGGACGTG 
TTTGGCCCAC 
CGCCAAGCCC 
CGTCTGGCTG 
AAATGTAAGG 
GCGCTCAGCA 
GGGCAGGCCA 
CAGCACCTGC 
GACGGAGATC 
GCCACCATGC 
GGGAGAGAGA 
AGCTGCTTGA 
GGGAACTGGG 
GGGAAGATTC 
TTCCCCCCAG 
CCTGTCCTCC 
CTAGGGGGCC 
TGCGACAATG 
GACGCTGCGG 
TGCAGAGATT 
TGCCCGTGGC 
TTTACAAGGA 
CACCGGAGGA 
GCTCCCTGTG 
ATCCCAGAGA 
GACGACCCCC 
GTGGACATCG 
CATGGGAAGG 
CGCACGGTCA 
ATTGCCTACC 
TCTTCATCCT 
GGAGGGTTCC 
CAGAAAGGAA 
GCCAAGGAGC 
CCCAGAACCC 
CCAATCACTA 
GGGTCCAATC 
TACGGGGTCC 
GGGCTACAGG 
AAAGGGGCTA 
AGGAAAAGGG 
TACCAGGAAA 
TCACTACCAG 
CCAATCACTA 
GGCTCCAATC 
TACGGGCTCC 
GGGCTACGGG 
AAAGGGGCTA 
CTCAATCCCG 
TTCGACGGAG 
CTGTCCGTCT 
ACCCGGTTTG 
GCCCACCTGA 
CACTTTGGCC 
ATGGTGAGCC 



41 
I 

GGATGGGACT 
GGTACAATGG 
TCGCGGTCGA 
TCGGGGTCAC 
CCAATAATGC 
ACAGGCCTGT 
TCAGCGGAAG 
AGAGGGTGCC 
TTCTTCTGAG 
ATAACCGGTG 
TCTTTGCCGG 
ACATTGCCAA 
AGGCCAGTGA 
TCAGCAAATA 
GCAGAACCGA 
ATGGAAGCAC 
CAGCAGCTTT 
TTCGAACAGC 
CATGTTACTA 
CCCAACACTA 
GAAAACTAGC 
GCCGCCATGC 
CCACTGTGGT 
TGTCCAGATG 
CTGCTAGAGA 
CAGGGAGGAG 
CAGCTCTCGG 
CTGGGGCAGT 
GGCCTCTTGA 
TTCTGGACAT 
ATGGAGACCA 
GCTCCTCTGA 
AGGTGGGCCT 
GAGGCGTCAG 
AGAATGGGCC 
CCAGTGCTGA 
TTCCTCACTC 
ATGCACGTCT 
CCGGGTCACG 
CACTCAGCCT 
TCCTGGGGTC 
GCCTGATGAC 
ACCAGCATGG 
TCTATGGCAA 
TCCGCTTCCG 
TCACCGCCGA 
GCAGCTCCTC 
TGACAGCTGG 
CAGGGCCAGG 
GGAAGGACGA 
CGGCCTCTGC 
AAGCGCCACA 
CCAGGAAAAG 
ACTACCAGGA 
AATCACTACC 
GTCCAATCAC 
CAGGGTCCAA 
GCTACGGGGT 
AGGGGCTACG 
GAAAAGGGGC 
CCAGGAAAAG 
ACTACCAGGA 
AATCACTACC 
CTCCAATCAC 
CGGGGTCCAA 
GCGACGCCTT 
ACGGGATGCT 
TCCGGGGCAA 
GGGCCTTTGC 
GGATCATCGA 
TGGGGAAGGA 
GGAACGTGGC 



51 
I 

GGGTGGGCCC 
ACCCAACCTG 
TGAGCGCAGC 
AGCCTGCGAC 
CTTCTCGGGC 
GCTGAAGCCT 
GGACTTTTCC 
GGTTCCCTGC 
ACCCAAATCA 
GGAAGACATC 
ACGCTCTGTG 
TTACGCCTAC 
CCTCTCCCGG 
TACAGAAGGC 
GGAGCGGGAA 
CAGCCAACTG 
GGTGGAGGAA 
TCTGCAGACT 
TTCTGTCTGC 
CCCTGTAGCC 
CCGGAGTGTC 
TGAGCCCGGC 
GCCAGGGGGC 
TGCACTCAGG 
GCTGTATGAC 
AAGGGACTCG 
GGGACTCGAG 
AGGAAGACCA 
AGCCGGGACA 
GGCCAAGGCC 
TGAGCCCAGA 
GGAGCCTCTG 
GGGGCTTGCT 
CGTGGGCCCC 
TAACTTCCTT 
ACGTCGTTTA 
CCTGTGCCAC 
TCTTCAGGCT 
GTTCTATTCA 
CCAGGGTTCT 
TCTGATCCCC 
CCACAGCTAT 
GCGAGGTGTC 
CTGGAATGGC 
GGACATCGCC 
CTTTGACAAT 
AGCCAACCGC 
TGGGAGGAAC 
GGGTCAGGCC 
GGACTGGGCA 
TATTGCAGGG 
AGATACAAAG 
GGGCTACGGG 
AAAGGGGCTA 
AGGAAAAGGG 
TACCAGGAAA 
TCACTACCAC 
CCAATCACTA 
GGGTCCAATC 
TACGGGGTCC 
GGGCTACAGG 
AAAGGGGCTA 
AGGAAAAGAG 
TACCAGGAAA 
CGTCAT CCGT 
GGAGCCTGAG 
GGACCTCATC 
TCAGGGCTTC 
CAGGGGAGCT 
CGGGGGCTCA 
TGAAGCCAGC 
CAGCGGGGAG 
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367 



WO 02/086443 

ATGAACTCAG TGCTGGAGAT CCTCTACCCC CGGGATGAGG ACACACTTCA GGACCCAGCC 
CCACTGGAGT GTGGCCAAGG ATTCTCCCAG CAGGAAAATG GCCATTGCAT GGACACCAAT 
GAATGCATCC AGTTCCCATT CGTGTGCCCT CGAGACAAGC CCGTATGTGT CAACACCTAT 
GGAAGCTACA GGTGCCGGAC CAACAAGAAG TGCAGTCGGG GCTACGAGCC CAACGAGGAT 
GGCACAGCCT GCGTGGGTAC TGAGCTAGGC TCTAGGCATA CAATGACGTG GAAAC CAAGG 
CCCAAAAAGG AGCTGCAACT TTCCCAAGGC ATCTGCACCC CCGTCTGGTC CTTTTTCCTG 
CCGGGTTGCC GGCTGCTCCT CAAAAGAGCT CAGCTCCAGG CTGCTCCCAG CACCCTTCTC 
CAGAAAGCTC CAGGTATTCC AGAAG CCCAA GTGTATGAAC AAGATCAGGA ATAA 

Seq ID NO: 473 Protein sequence 
Protein Accession #: FGENESH predicted 

1 11 21 31 41 51 

I I I 1 I I 

MACPGGLPAR CSGWMGLGGP SGSSPASPPH SSSRYNGPNL VLKYDRAQKR LVNIAVDERS 

SPYYALRDRQ GNAI GVTACD IDGDGREEIY FLNTNNAFSG HSSSAQVPSG LHRNRPVLKP 

PPTTPAGLLG LPPLSGRDFS SSLGQASPDS RQGERVPVPC CRGGLRPTHE PEPFLLRPKS 

GVATYTDKLF KFRNNRWED I LSDEVNVARG VASLFAGRSV ACVDRKGSGR YSIYIANYAY 

GNVGPDALIE MDPEASDLSR GILALRDVAA EAGVSKYTEG FSHTASPSIG EISGRTEERE 

GGDPEEADEE HSGDGSTSQL CRLGWKDGQF KEEAAALVEE QREAGAAGVP RGRVRTALQT 

SKSHLADKNL FGPPCYYSVC APSPAHPFPA RQAPQHYPVA PLVTQLMTHG RLAGKLARSV 

PHPRAPGMDP KCKGRHAEPG LMAEALGAWP ALSTTWPGG LRSWEESRQK GQAMSRCALR 

ELGGPWSQAT QHLPARELYD LGEPPILQRT DGDPGRRRDS PKVTQECHLV ATMPALGGLE 

GPGRVAKREI GRETGAVGRP LSHPLVPNFP SCLRPLEAGT VPGAALPGNP GNWVLDMAKA 

LAWNQMEKEE GKIHGDHEPR FRLRKAREAE FPPGSSEEPL LQFPSGLRGS PVLQVGLGLA 

SATHCGSMSF LGGRGVSVGP ILSSSASDIF CDNENGPNFL FHNRGDGT F V DAAASAERRL 

AFIVHLKYHL CRDFPHSLCH LAETGPSSSC CPWHARLLQA PHCHHGLSMS FTRTGSRFYS 

FLTQGLASSA HRRTLSLQGS QGAPPCLLAR APCVLGSLIP TAYYIVLWSA IPESLMTHSY 

LSSERVNVGV DDPHQHGRGV ALADFNRDGK VD I VYGNWNG PHRLYLQMST HGKVRFRD I A 

SPKFSMPSPV RTVITADFDN DQELEIFFNN IAYRSSSANR LFRCSILARG SSSLTAGGRN 

GQGEGLRIRR GGFPGPGGQA KVNTGPLMKK QKGRKDEDWA RGCGNAGQSL AKE PA S A I AG 

KGKGNVAQSV PRTQAPQDTK PHYHKKGLQG PITTRKRGYG VQSLPGKGAT GSNHYQEKGL 

RGPITTRKRG YGVQSLPGKG ATGSNHYQEK GLQGPITTRK RGYGLQSLPG KGATGSNHYH 

RKGLRAPITT RKRGYGVQSL PGKGATGSNH YQEKGLRGPI TTRKRGYGLQ SLPGKGATGS 

NHYQEKGLQG PITTRKRGYR VQSLPQKGAT GSNHYQEKGIi RGPITTRKRG YGLQSLPGKE 

AMGSNHYQEK GLRAPITTRK RGYGVQSLPQ KGATGSNVIR REHGDPLIEE LNPGDALEPE 

GRGTGGWTD FDGDGMLDLI LSHGESMAQP LSVFRGNQGF NNNWLRWPR TRFGAFARGA 

KWLYTKKSG AHLRIIDGGS GYLCEMEPVA HFGLGKDEAS SVEVTWPDGK MVSRNVASGE 

MNSVLEILYP RDEDTLQDPA PLECGQGFSQ QENGHCMDTN ECIQFPFVCP RDKPVCVNTY 

GSYRCRTNKK CSRGYEPNED GTACVGTELG SRHTMTWKPR PKKELQLSQG ICTPVWSFFL 

PGCRLLLKRA QLQAAPSTLD QKAPGIPEAQ VYEQDQE 

Seq ID NO: 474 DNA sequence 

Nucleic Acid Accession #: NM_003661.1

Coding sequence: 1..1152 

1 11 21 31 41 51 

I I I I I I 

ATGAGTGCAC TTTTCCTTGG TGTGGGAGTG AGGGCAGAGG AAGCTGGAGC GAGGGTGCAA 
CAAAACGTTC CAAGTGGGAC AGATACTGGA GATCCTCAAA GTAAGCCCCT CGGTGACTGG 
GCTGCTGGCA CCATGGACCC AGAGAGCAGT AT CTTTATTG AGGATGCCAT TAAGTATTTC 
AAGGAAAAAG TGAGCACACA GAATCTGCTA CTCCTGCTGA CTGATAATGA GGCCTGGAAC 
GGATTCGTGG CTGCTGCTGA ACTGCCCAGG AATGAGGCAG ATGAGCTCCG TAAAGCTCTG 
GACAACCTTG CAAGACAAAT GATCATGAAA GACAAAAACT GGCACGATAA AGGCCAGCAG 
TACAGAAACT GGTTTCTGAA AGAGTTTCCT CGGTTGAAAA GTGAGCTTGA GGATAACATA 
AGAAGGCTCC GTGCCCTTGC AGATGGGGTT CAGAAGGTCC ACAAAGGCAC CACCATCGCC 
AATGTGGTGT CTGGCTCTCT CAGCATTTCC TCTGGCATCC TGACCCTCGT CGG CATGGGT 
CTGGCACCCT TCACAGAGGG AGGCAGCCTT GTACTCTTGG AACCTGGGAT GGAGTTGGGA 
ATCACAGCCG CTTTGACCGG GATTACCAGC AGTACCATGG ACTACGGAAA GAAGTGGTGG 
ACACAAGCCC AAGCCCACGA CCTGGTCATC AAAAGCCTTG ACAAATTGAA GGAGGTGAGG 
GAGTTTTTGG GTGAGAACAT ATCCAACTTT CTTTCCTTAG CTGGCAATAC TTACCAACTC 
ACACGAGGCA TTGGGAAGGA CATCCGTGCC CTCAGACGAG CCAGAGCCAA TCTTCAGTCA 
GTACCGCATG CCTCAGCCTC ACGCCCCCGG GTCACTGAGC CAATCTCAGC TGAAAGCGGT 
GAACAGGTGG AGAGGGTTAA TGAACCCAGC ATCCTGGAAA TGAGCAGAGG AGTCAAGCTC 
ACGGATGTGG CCCCTGTAAG CTTCTTTCTT GTGCTGGATG TAGTCTACCT CGTGTACGAA 
TCAAAGCACT TACATGAGGG GGCAAAGTCA GAGACAGCTG AGGAGCTGAA GAAGGTGGCT 
CAGGAGCTGG AGGAGAAGCT AAACATTCTC AACAATAATT ATAAGATTCT GCAGGCGGAC 
CAAGAACTGT GA 

Seq ID NO: 475 Protein sequence 
Protein Accession #: NP_003652.1

1 11 21 31 41 51 

I I I I I I 

MSALFLGVGV RAEEAGARVQ QNVPSGTDTG DPQSKPLGDW AAGTMDPESS IFIEDAIKYF 

KEKVSTQNLL LLL.TDNEAWN GFVAAAELiPR NEADELRKAIj DNLARQMIMK DKNWHDKGQQ 

YRNWFLKEFP RLKSELEDNI RRLRALADGV QKVHKGTTIA NWSGSLSIS SGILTLVGMG 

LAPFTEGGSL VLLEPGMELG ITAALTGITS STMDYGKKWW TQAQAHDLVI KSLDKLKEVR 

EFLGENISNF LSLAGNTYQL TRGIGKDIRA LRRARANLQS VPHASASRPR VTEPISAESG 

EQVERVNEPS ILEMSRGVKL TDVAPVSFFL VLDWYLVYE SKHLHEGAKS ETAEELKKVA 

QELEEKLNIL NNNYKILQAD QEL 

Seq ID NO: 476 DNA sequence 

Nucleic Acid Accession #: NM_014452.1

Coding sequence: 1..1968 

1 11 21 31 41 51 
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I I 

ATGGGGACCT CTCCGAGCAG 
GCCACAGCCA CGATGATCGC 
GCTCAGCCAG AACAGAAGGC 
ACCGGCCAGG TGCTAACCTG 
ACCAACACAA GCCTGCGCGT 
AATGGCATAG AGAAATGCCA 
TTACCTTGTG CTGCCTTGAC 
AACGCTACCT GTGCCCCCCA 
ACAGAGACTG AGGATGTGCG 
TCTAGTGTGA TGAAATGCAA 
AAGCCGGGGA CCAAGGAGAC 
ACCTCACCTT CCCCTGGCAC 
GTCCCTTCCT CCACTTATGT 
TCTGTTAGAC CAAAGGTACT 
TCAGCAAGGG GGAAGGAAGA 
CAGCAAGGCC CCCACCACAG 
GGCGAGAAGT CCAGCACGCC 
CACAAGCATT TTGACATCAA 
GTGCTTGTGG TGATTGTGGT 
CCCCGGCAGG ATCCCAGTGC 
ACCCAGAACC GGGAGAAATG 
CTTGTAGCAG CCCAAGTGGG 
AGTGAGAGGG AGGTTGCTGC 
GCAGCTCTGC AGCACTGGAC 
GCCCTGCGCC AGCACCGGAG 
ACCACCCAGC TGGAAACTGA 
AGCCCCATCC CCAGCCCCAA 
TCCCCACAGG ACAAGAACAA 
GACTCTACAT CCAGCGGCTC 
AAGAAGGACA CAGTGTTGCG 
GATGACATGC TCCACTTTCT 
GCTGAGGACA AACTAGACCG 
CAGACCCTCC TGGACTCTGT 
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CAGCACCGCC 
GGGCTCCCTT 
CTCGAATCTC 
TGACAAGTGT 
CTG CAGCAGT 
TGACTGTAGT 
TGACCGAGAA 
TACGGTGTGT 
GTGTAAGCAG 
AG CAT ACACA 
AGACAACGTC 
AGCCATCTTT 
TCCCAAAGGC 
GAGTAGCATC 
CGTGAACAAG 
ACACATCCTG 
CATCAAGGGC 
TGAGCATTTG 
GTGCAGTATC 
CATTGTGGAA 
GAT CTACTAC 
AAGCCAGTGG 
TTTCTCCAAT 
CATCCGGGGC 
AAACGATGTT 
CAAACTAGCT 
CGCGAAACTT 
GGGCTTCTTC 
CTCCGCGCTG 
GCAGGTACGC 
AAATCCTGAG 
GCTATTCGAA 
TTATAGCCAT 



CTCGCCTCCT 
CTCCTGCTTG 
ATTGGCACAT 
CCAGCAGGAA 
TGCCCTGTGG 
CAGCCATGCC 
TGCACTTGCC 
CCTGTGGGTT 
TGTGCTCGGG 
GACTGTCTGA 
TGTGGCACAC 
CCACGCCCTG 
ATGAACTCAA 
CAGGAAGGGA 
ACCCTCCCAA 
AAGCTGCTGC 
CCCAAGAGGG 
CCCTGGATGA 
CGGAAAAGCT 
AAGGCAGGGC 
TGCAATGGCC 
AAAGATATCT 
GGGTACACAG 
CCCGAGGCCA 
GTGGAGAAGA 
CTCCCGATGA 
GAGAATTCCG 
GTGGATGAGT 
AGCAGGAACG 
CTGGACCCCT 
GAGCTGCGGG 
ATTATTGGAG 
CTTCCTGACC 



GCAGCCGCAT 
GATTCCTTAG 
ACCGCCATGT 
CCTATGTCTC 
GGACCTTTAC 
CATGGCCAAT 
CACCTGGCAT 
GGGGTGTGCG 
GTACCTTCTC 
GTCAGAACCT 
TCCCGTCCTT 
AG CACATGGA 
CAGAATCCAA 
CAGTCCCTGA 
ACCTTCAGGT 
CGTCCATGGA 
GACATCCTAG 
TTGTGCTTTT 
CGAGGACTCT 
TGAAGAAATC 
ATGGTATCGA 
ATCAGTTTCT 
CCGACCACGA 
GCCTCGCCCA 
TTCGTGGGCT 
GCCCCAGCCC 
CT GT C CTG AC 
CGGAGCCCCT 
GTTCCTTTAT 
GTGACTTGCA 
TGATTGAAGA 
TCAAGAGCCA 
TGCTGTAG 



CGCCCGCCGA 60 

CACCACCACA 120 

TGACCGTGCC 180 

TGAGCATTGT * 240 

CAGGCATGAG 300 

GATTGAGAAA *I'360 

GTTCCAGTCT 420 

GAAGAAAGGG 480 

AGATGTGCCT 540 

GGTGGTGATC 600 

CTCCAGCTCC 660 

AACCCATGAA 720 

CTCTTCTGCC 780 

CAACACAAGC 840 

AGTCAACCAC 900 

GGCCACTGGG 960 

ACAGAACCTA 1020 

CCTGCTGCTG 1080 

GAAAAAGGGG 1140 

CATGACTCCA 1200 

TAT CCTGAAG 1260 

TTGCAATGCC 1320 

GCGGGCCTAC 13 80 

GCTAATTAGC 1440 

GATGGAAGAC 1500 

GCTTAGCCCG 1560 

GGTGGAGCCT 1620 

TCTCCGCTGT 1680 

TACCAAAGAA 1740 

GCCTATCTTT 1800 

GATTCCCCAG 1860 

GGAAGCCAGC 1920 
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40 



45 



50 



MGTSPSSSTA 
TGQVLTCDKC 
LPCAALTDRE 
SSVMKCKAYT 
VPSSTYVPKG 
QQGPHHRHIL 
VLWIWCSI 
LVAAQVGSQW 
ALRQHRRNDV 
SPQDKNKGFF 
DDMLHPLNPE 



11 
i 

LASCSRIARR 
PAGTYVSEHC 
CTCPPGMFQS 
DCLSQNLWI 
MNSTESNSSA 
KLLPSMEATG 
RKSSRTLKKG 
KDIYQFLCNA 
VEKIRGLMED 
VDESEPLLRC 
ELRVIEEIPQ 



21 
1 

ATATMIAGSL 
TNTSLRVCSS 
NAT CAPHT VC 
KPGTKETDNV 
SVRPKVLSSI 
GEKSSTPIKG 
PRQDPSAIVE 
SEREVAAFSN 
TTQLETDKLA 
DSTSSGSSAL 
AEDKLDRLFE 



31 
1 

LLLGFLSTTT 
CPVGTFTRHE 
PVGWGVRKKG 
CGTLPSFSSS 
QEGTVPDNTS 
PKRGHPRQNL 
KAGLKKSMTP 
GYTADHERAY 
LPMSPSPLSP 
SRNGSFITKE 
IIGVKSQEAS 



41 
I 

AQPEQKASNL 
NGIEKCHDCS 
TETEDVRCKQ 
TSPSPGTAIF 
SARGKEDWK 
HKHFDINEHL 
TQNREKWIYY 
AALQHWTIRG 
SPIPSPNAKL 
KKDTVLRQVR 
QTLLDSVYSH 



51 
1 

IGTYRHVDRA 60 

QPCPWPMIEK 120 

CARGTFSDVP 180 

PRPEHMETHE 240 

TLPNLQWNH 300 

PWMIVLFLLL 360 

CNGHGIDILK 420 

PEASLAQLIS 480 

ENSALLTVEP 540 

LDPCDLQPIF 600 
LPDLL 



55 



Seq ID NO: 478 DNA sequence 

Nucleic Acid Accession #: XM_044533 

Coding sequence: 238..2751
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70 



75 



80 



85 



GCTCTGCCCA 
AGGGGCTGAG 
GGAGGCGGGG 
AGTCCGGCCG 
CTGCGCACCG 
CGGCCACCGC 
TGGGCGCTCA 
TTCGAAGCTG 
CTGTACGTGG 
GGCGGGGAGT 
TTCAAGGGCA 
AGCGGCAGTC 
AACATGGAGA 
AAGGGCCGTT 
CTCTACACTG 
AGCCTTCGCC 
GCCTCAGCCT 
TTTTTCTTCA 
ATTGCCCGCA 
TCCTTCCTCA 
CTGCAGGATG 
GGGGTCTTCA 
ACAATGAAGG 
CAGCAGTGGT 
AACAGTGCCC 
TTCCTCAAGG 
CCCCAGGCTC 
GATGTCCTCT 
CGGGTGCACA 



AGCCGAGGCT 
TTTGCCAGGG 
GCCCCCGGGG 
AGCCACCTGA 
CGATGGGCCT 
TGCTGCTGCT 
GCCCCCGGAT 
AACACATCTC 
GTGCTCGAGA 
ACCAGGAGCT 
AGGACCCACA 
ACCTGTT CAC 
ACTTCACCCT 
GTCCCTTCGA 
GAACAGTCAG 
CCACCAAGAC 
ACATTCCTGA 
GCGAGACTGG 
TCTGCAAGGG 
AGGCCCAGCT 
TCTTCACGCT 
CTTCCCAGTG 
ATGTGCAGAG 
ACACCGTGAC 
GGGAAAGGAA 
ACCACTTCCT 
GCTACCAGCG 
TCCTGGGCAC 
TCATTGAGGA 



GCGGGGCCGG 
CCCACTTGAC 
CGACTCGGGG 
GCCCGAGCCG 
GAGGAGCTGG 
CCTGCTGCTG 
CAGCCTGCCT 
CAACTACACA 
GGCCCTCTTT 
GCTTTGGGGT 
GCGCGACTGT 
CTGTGGCACA 
GGCAAGGGAC 
CCCGAATTTC 
CAGCTTCCAA 
CGAGAGCTCC 
GAGCCTGGGC 
CCAGGAATTT 
CGATGAGGGT 
GCTGTGCTCA 
GAGCCCCAGC 
GCACAGGGGA 
AGTCTTCAGC 
CCACCCGGTG 
GATCAACTCA 
GATGGACGGG 
CGTGGCTGTA 
TGGTGACGGC 
GCTGCAGATC 



31 

I 

CGCCGGCGGG 
CCTGTTTCCC 
GCGGACCGCG 
CGGGACACCG 
CTCGCCGCCC 
CTGCTCCTGC 
CTGGGCTCTG 
GCCCTTCTGC 
GCACTCAGTA 
G CAGACGCAG 
CAAAACTACA 
GCAGCCTTCA 
GAGAAGGGGA 
AAGTCCACTG 
GGGAATGACC 
CT C AACTGGC 
AGCTTG CAAG 
GAGTTCTTTG 
GGAGAGCGGG 
CGGCCCGACG 
CCCCAGGACT 
ACTACAGAAG 
GGCCTCTACA 
CCCACACCCC 
TCCCTGCAGC 
CAGGTCCGAA 
CACCGCGTCC 
CGGCTCCACA 
TTCTCATCGG 



41 
I 

AGGACTGCGG 
ACCTCCCGCC 
GGGCGGAGCT 
TCGCTCCTGC 
CATGGGGCGC 
TGCAGCCGCC 
AAGAGCGGCC 
TGAGCAGGGA 
GCAACCTCAG 
AGAAGAAACA 
TCAAGATCCT 
GCCCCATGTG 
ATGTCCTCCT 
CCCTGGTGGT 
CGGCCATCTC 
TGCAAGACCC 
GCGATGATGA 
AGAACACCAT 
TGCTACAGCA 
ATGGCTTCCC 
GGCGTGACAC 
GCTCTGCCGT 
AGGAGGTGAA 
GGCCTGGAGC 
TCCCAGACCG 
GCCGCATGCT 
CTGGCCTGCA 
AGGCAGTGAG 
GACAG CCCGT 



51 
I 

TGCCCCGCGG 60 

CCCCAGGTCC 12 0 

GCCGCCCGTG 180 

TCTCCGAATG 240 

GCTGCCGCCT 3 00 

GCCTCCGACC 360 

ATTCCTCAGA 42 0 

TGGCAGGACC 480 

CTTCCTGCCA 540 

GCAGTGCAGC 600 

CCTGCCGCTC 660 

TACCTACATC 720 

GGAAGATGGC 7 80 

TGATGGCGAG 840 

GCGGAGCCAA 900 

AGCTTTTGTG 960 

CAAGATCTAC 1020 

TGTGTCCCGC 1080 

GCGCTGGACC 1140 

CTTCAACGTG 1200 

CCTTTTCTAT 1260 

CTGTGTCTTC 1320 

CCGTGAGACA 13 80 

GTGCATCACC 1440 

CGTGCTGAAC 1500 

GCTGCTGCAG 1560 

CCACACCTAC 1620 

CGTGGGCCCC 1680 

GCAGAATCTG 1740 



369 
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CTCCTGGACA CCCACAGGGG GCTGCTGTAT GCGGCCTCAC ACTCGGGCGT AGTCCAGGTG 180 0 

CCCATGGCCA ACTGCAGCCT GTACAGGAGC TGTGGGGACT GCCTCCTCGC CCGGGACCCC 1860 

TACTGTGCTT GGAGCGGCTC CAGCTGCAAG CACGTCAGCC TCTACCAGCC TCAGCTGGCC 192 0 

ACCAGGCCGT GGAT CCAGG A CAT CGAGGGA GCCAGCGCCA AGGACCTTTG CAGCGCGTCT 1980 

TCGGTTGTGT CCCCGTCTTT TGTACCAACA GGGGAGAAGC CATGTGAGCA AGTCCAGTTC 2040 

CAGCCCAACA CAGTGAACAC TTTGGCCTGC CCGCTCCTCT CCAACCTGGC GACCCGACTC 2100 

TGGCTACGCA ACGGGGCCCC CGTCAATGCC TCGGCCTCCT GCCACGTGCT ACCCACTGGG 2160 

GACCTGCTGC TGGTGGGCAC CCAACAGCTG GGGGAGTTCC AGTGCTGGTC ACTAGAGGAG 2220 

GGCTTCCAGC AGCTGGTAGC CAG CTACTGC CCAGAGGTGG TGGAGGACGG GGTGGCAGAC 22 80 

CAAACAGATG AGGGTGGCAG TGTACCCGTC ATTATCAGCA CATCGCGTGT GAGTGCACCA 2340 

GCTGGTGGCA AGGCCAGCTG GGGTGCAGAC AGGTCCTACT GGAAGGAGTT CCTGGTGATG 2400 

TGCACGCTCT TTGTGCTGGC CGTGCTGCTC CCAGTTTTAT TCTTGCTCTA CCGGCACCGG 2460 

AACAGCATGA AAGTCTTCCT GAAGCAGGGG GAATGTGCCA GCGTGCACCC CAAGACCTGC 2520 

CCTGTGGTGC TGCCCCCTGA GACCCGCCCA CTCAACGGCC TAGGGCCCCC TAGCACCCCG 2580 

CTCGATCACC GAGGGTACCA GTCCCTGTCA GACAGCCCCC CGGGGTCCCG AGTCTTCACT 2640 

GAGTCAGAGA AGAGGCCACT CAGCATCCAA GACAGCTTCG TGGAGGTATC CCCAGTGTGC 2700 

CCCCGGCCCC GGGTCCGCCT TGGCTCGGAG AT CCGTG ACT CTGTGGTGTG AGAGCTGACT 2760 

TCCAGAGGAC GCTGCCCTGG CTTCAGGGGC TGTGAATGCT CGGAGAGGGT CAACTGGACC 2820 

TCCCCTCCGC TCTGCTCTTC GTGGAACACG ACCGTGGTGC CCGGCCCTTG GGAGCCTTGG 2 880 

GGCCAGCTGG CCTGCTGCTC TCCAGT CAAG TAGCGAAGCT CCTACCACCC AGACACCCAA 2 940 

ACAGCCGTGG CCCCAGAGGT CCTGGCCAAA TATGGGGGCC TGCCTAGGTT GGTGGAACAG 3 000 

TGCTCCTTAT GTAAACTGAG CCCTTTGTTT AAAAAACAAT TCCAAATGTG AAACTAGAAT 3060 

GAGAGGGAAG AGATAGCATG GCATGCAGCA CACACGGCTG CTCCAGTTCA TGGCCTCCCA 312 0 

GGGGTGCTGG GGATGCATCC AAAGTGGTTG TCTGAGACAG AGTTGGAAAC CCTCACCAAC 3180 

TGGCCTCTTC ACCTTCCACA TTATCCCGCT GCCACCGGCT GCCCTGTCTC AC TG CAG ATT 3 240 

CAGGACCAGC TTGGGCTGCG TGCGTTCTGC CTTGCCAGTC AGCCGAGGAT GTAGTTGTTG 330 0 

CTGCCGTCGT CCCACCACCT CAGGGACCAG AGGGCTAGGT TGGCACTGCG GCCCTCACCA 3360 

GGTCCTGGGC TCGGACCCAA CTCCTGGACC TTTCCAGCCT GTATCAGGCT GTGGCCACAC 3420 

GAGAGGACAG CGCGAGCTCA GGAGAGATTT CGTGACAATG TACGCCTTTC CCTCAGAATT 3480 

CAGGGAAGAG ACTGTCGCCT GCCTTCCTCC GTTGTTGCGT GAGAACCCGT GTGCCCCTTC 3540 

CCACCATATC CACCCTCGCT CCATCTTTGA ACTCAAACAC GAGGAACTAA CTGCACCCTG 3600 

GTCCTCTCCC CAGTCCCCAG TTCACCCTCC ATCCCTCACC TTCCTCCACT CTAAGGGATA 3660 

TCAACACTGC CCAG CACAGG GGCCCTGAAT TTATGTGGTT TTTATACATT TTTTAATAAG 3720 
ATGCACTTTA TGTCATTTTT TAATAAAGTC TGAAGAATTA CTGTTT 

Seq ID NO: 479 Protein sequence 
Protein Accession #: XP_044533.3 

1 11 21 31 41 51 

I I I I I 1 

MLRTAMGLRS WLAAPWGALP PRPPLLLLLL LLLLLQPPPP TWALSPRISL PLGSEERPFL 60 

RFEAEHISNY TALLLSRDGR TLYVGAREAL FALSSNLSFL PGGEYQELLW GADAEKKQQC 120 

SFKGKDPQRD CQNYIKILLP LSGSHLFTCG TAAFSPMCTY INMENFTLAR DEKGNVLLED 180 

GKGRCPFDPN FKSTALWDG ELYTGTVSSF QGNDPAISRS QSLRPTKTES SLNWliQDPAF 240 

VASAYIPESL GSLQGDDDKI YFFFSETGQE FEFFENTIVS RIARICKGDE GGERVLQQRW 300 

TSFLKAQIjLC SRPDDGFPFN VLQDVFTLSP SPQDWRDTLF YGVFTSQWHR GTTEGSAVCV 360 

FTMKDVQRVF SGIiYKEVNRE TQQWYTVTHP VPTPRPGACI TNSARERKIN SSLQLPDRVIi 42 0 

NFLKDHFLMD GQVRSRMLLL QPQARYQRVA VHRVPGLHHT YDVLFLGTGD GRLHKAVSVG 480 

PRVHIIEELQ IFSSGQPVQN LLLDTHRGLL YAASHSGWQ VPMANCSLYR SCGDCLLARD 540 

PYCAWSGSSC KHVSLYQPQL ATRPWIQDIE GASAKDLCSA SSWSPSFVP TGEKPCEQVQ 60 0 

FQPNTVNTLA CPLLSNLATR LWLRNGAPVN ASASCHVLPT GDLLLVGTQQ LGEFQCWSLE 660 

EGFQQLVASY CPEWEDGVA DQTDEGGSVP VIISTSRVSA PAGGKASWGA DRSYWKEFLV 720 

MCTLFVLAVL LPVLFLLYRH RNSMKVFLKQ GECASVHPKT CPWLPPETR PLNGLGPPST 780 
PLDHRGYQSL SDSPPGSRVF TESEKRPLSI QDSFVEVSPV CPRPRVRLGS EIRDSW 

Seq ID NO: 480 DNA sequence 

Nucleic Acid Accession #: NM_004217.1 

Coding sequence: 58..1092

1 11 21 31 41 51 

! | I I I I 

GGCCGGGAGA GTAGCAGTGC CTTGGACCCC AGCTCTCCTC CCCCTTTCTC TCTAAGGATG 60

GCCCAGAAGG AGAACTCCTA CCCCTGGCCC TACGGCCGAC AGACGGCTCC ATCTGGCCTG 120

AGCACCCTGC CCCAGCGAGT CCTCCGGAAA GAGCCTGTCA CCCCATCTGC ACTTGTCCTC 180 

ATGAGCCGCT CCAATGTCCA GCCCACAGCT GCCCCTGGCC AGAAGGTGAT GGAGAATAGC 240 

AGTGGGACAC CCGACATCTT AACGCGGCAC TTCACAATTG ATGACTTTGA GATTGGGCGT 300 

CCTCTGGGCA AAGGCAAGTT TGGAAACGTG TACTTGGCTC GGGAGAAGAA AAGCCATTTC 360 

ATCGTGGCGC TCAAGGTCCT CTTCAAGTCC CAGATAGAGA AGGAGGGCGT GGAGCATCAG 420 

CTGCGCAGAG AGAT CGAAAT CCAGGCCCAC CTGCACCATC CCAACATCCT GCGTCTCTAC 480 

AACTATTTTT ATGACCGGAG GAGGATCTAC TTGATTCTAG AGTATGCCCC CCGCGGGGAG 540 

CTCTACAAGG AGCTGCAGAA GAGCTGCACA TTTGACGAGC AGCGAACAGC CACGATCATG 600 

GAGGAGTTGG CAGATGCTCT AATGTACTGC CATGGGAAGA AGGTGATTCA CAGAGACATA 660 

AAG CCAG AAA ATCTGCTCTT AGGGCTCAAG GGAGAGCTGA AGATTGCTGA CTTCGGCTGG 72 0 

TCTGTGCATG CGCCCTCCCT GAG GAGG AAG ACAATGTGTG GCACCCTGGA CTACCTGCCC 780 

CCAGAGATGA TTGAGGGGCG CATGCACAAT GAGAAGGTGG ATCTGTGGTG CATTGGAGTG 840 

CTTTGCTATG AGCTGCTGGT GGGGAACCCA CCCTTTGAGA GT G CAT CACA CAACGAGACC 90 0 

TATCGCCGCA TCGTCAAGGT GGACCTAAAG TTCCCCGCTT CTGTGCCCAC GGGAGCCCAG 960 

GACCTCATCT CCAAACTGCT CAGGCATAAC CCCTCGGAAC GGCTGCCCCT GGCCCAGGTC 102 0 

TCAGCCCACC CTTGGGTCCG GGCCAACTCT CGGAGGGTGC TGCCTCCCTC TGCCCTTCAA 1080 

TCTGTCGCCT GATGGTCCCT GTCATTCACT CGGGTGCGTG TGTTTGTATG TCTGTGTATG 1140 

TATAGGGGAA AGAAGGG AT C CCTAACTGTT CCCTTATCTG TTTTCTACCT CCTCCTTTGT 1200 
TTAATAAAGG CTGAAGCTTT TTGT 

Seq ID NO: 481 Protein sequence 
Protein Accession #: NP_004208 

1 ll 21 31 41 51 
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MAQKENSYPW PYGRQTAPSG LSTLPQRVLR KEPVTPSALV LMSRSNVQPT AAPGQKVMEN 

SSGTPDILTR HFTIDDFEIG RPLGKGKFGN VYLAREKKSH F I VALKVLFK SQIEKEGVEH 

QLRREIEIQA HLHHPNILRD YNYFYDRRRI YLILEYAPRG ELYKELQKSC TFDEQRTATI 

MEELADALMY CHGKKVIHRD IKPENLLLGL KGELKIADFG WSVHAPSLRR KTMCGTLDYL 

PPEMIEGRMH NEKVDLWCIG VLCYELLVGN PPFESASHNE TYRRIVKVDL KFPASVPTGA 

QDIilSKLLRH NPSERLjPLAQ VSAHPWVRAN SRRVLPPSAL QSVA 



Seq ID NO: 482 DNA sequence 
Nucleic Acid Accession #; AK055663 
Coding sequence: 38.. 1423 



1 11 21 31 41 51 

I 1 I 1 1 1 

AGAACGGCTT CCGGCGGGAG CTGTGCAGCT CCTTATCATG GGGACAATTC ATCTCTTTCG 

AAAACCACAA AGATCCTTTT TTGGCAAGTT GTTACGGGAA TTTAGACTTG TAGCAGCTGA 

CCGAAGGTCC TGGAAGATAC TGCTCTTTGG TGTAATAAAC TTGATATGTA CTGGCTTCCT 

GCTTATGTGG TGCAGTTCTA CTAATAGTAT AGCTTTAACT GCCTATACTT ACCTGACCAT 

TTTTGATCTT TTTAGTTTAA TGACATGTTT AATAAGTTAC TGGGTAACAT TGAGGAAACC 

TAGCCCTGTC TATTCATTTG GGTTTGAAAG ATTAGAAGTC CTGGCTGTAT TTGCCTCCAC 

AGTCTTGGCA CAGTTGGGAG CTCTCTTTAT ATTAAAAGAA AGTGCAGAAC GGTTTTTGGA 

ACAGCCCGAG ATACACACGG GAAGATTATT AGTTGGTACT TTTGTGGCTC TTTGTTTCAA 

CCTGTTCACG ATGCTTTCTA TTCGGAATAA ACCTTTTGCT TATGTCTCAG AAGCTGCTAG 

TACGAGCTGG CTTCAAGAGC ATGTTG C AG A TCTTAGTCGA AGCTTGTGTG GAATTATTCC 

GGGACTTAGC AGT AT CTTCC TTCCCCGAAT GAATCCATTT GTTTTGATTG ATCTTGCTGG 

AGCATTTGCT CTTTGTATTA CATATATGCT CATTGAAATT AATAATTATT TTGCCGTAGA 

CACTGCCTCT GCTATAG CT A TTGCCTTGAT GACATTTGGC ACTATGT AT G CCATGAGTGT 

GTACAGTGGG AAAGTCTTAC TCCAGACAAC ACCACCCCAT GTTATTGGTC AGTTGGACAA 

ACTCATCAGA GAGGTATCTA CCTTAGATGG AGTTTTAGAA GTCCGAAATG AACATTTTTG 

GACCCTAGGT TTTGGCTCAT TGGCTGGATC AGTGCATGTA AGAATTCGAC GAGATGCCAA 

TGAACAAATG GTTCTTGCTC ATGTGACCAA CAGGCTGTAC ACTCTAGTGT CTACTCTAAC 

TGTTCAAATT TTCAAGGATG ACTGGATTAG GCCTGCCTTA TTGTCTGGGC CTGTTGCAGC 

CAATGTCCTA AACTTTTCAG ATCATCACGT AATCCCAATG CCTCTTTTAA AGGGTACTGA 

TGATTTGAAC CCAGTTACAT CAACTCCAGC TAAACCTAGT AGTCCACCTC CAGAATTTTC 

ATTTAACACT CCTGGGAAAA ATGTGAACCC AGTTATTCTT CTAAACACAC AAACAAGGCC 

TTATGGTTTT GGTCTCAATC ATGGACACAC ACCTTACAGC AGCATGCTTA ATCAAGGACT 

TGGAGTTCCA GGAATTGGAG CAACTCAAGG ATTGAGGACT GGTTTTACAA ATATACCAAG 

TAGATATGGA ACTAATAATA GAAT TGGAC A ACCAAGACCA TGATAGACTC TAACTTATTT 

TTATAAGGAA TATTGACTCC TTGGCTTCCA ATTTATTTAG TAATCCAACT TTGCATTGAC 

TGTTTAATCA TTTACTCTAA ATGTTAGATA ATAGTAGTCT TGTTCACATT TCATGAAACC 

TATGAAACTA TATTTTTGTA AAATGTATTT GTGACAGTGA AATCCTCGTA AATGTTAAAG 

GCTTTAAATA GGCTTCCTTT AGAAAATGTG TTTCTTTAAA TTTGGATTTT GGTATCTTTG 

GT T T T GT AGT TGACTGCAGT GTGATGTGAC CTTACCTTTA TAAGAGCCAC TTGATGGAGT 

AGATCTGTCA CATTACTAAG ATACGATATT TCTTTTTTTT TCCGAGACGG AGTCTTGCTC 

TGCCACTGTG CCCGGCCAAT ACATTATTAT TAACTTAAGG CTGTACTTTA TT AAGGCTT C 

CTTAGTTTTT GTTTTGTTTT GTTTTTTGAG ATGGAGTCTC ACTCTGTCGC CCAGGCTGGA 

ATGCAGTGGC ATGATCTCAG CTCACTGCAA CCTCTGCCTC CTGAGTTCAA ATGATTCTCC 

TGCCTCAGCC TCCCGAGTAG CTGGGATTAC AGGCACCTGC CACCACGCCC AGCTAATTTT 

TGTATT TTTA GTAAAGACGG GGGATTTCAC CATGTTGGCC AGGCTGGTCT TGAACTCCTG 

ACCTCATGAT CCACCCACCT TAGCCTCCCA AAGTGCTGGG ATTAGGTGTG AGCCACCGCA 

CCTGGCCGAT ATTTTCTTTA ATGAAATTTA TAAATATGCT T CTTGAATAA TACACATTTT 

GGGAAAGGGA AAAATGTCTG TTCAAAAAGT AAAGGTCTCT TTTATAGCTT TTCCAAACTT 

AATTGCTAAA TTTTTCTTTG AGGTTCTCCT GAATTATGTC TTACAAACTA AAAGCAAAAA 

TTTTTAGCAG AAATTTTGGA ATACATTCTA TCTAGCACAA TTTGAATTTT TAATTATCAA 

GATTTTTGTT AAAGTTTCTC TCCTTTAAAA ATTTTAGTAC ATTTGTAAAT 



Seq ID NO: 483 Protein sequence 
Protein Accession #: BAB70980.1 

1 11 21 31 41 51 

I I 1 1 I I 

MGTIHLFRKP QRSFFGKLLR EFRLVAADRR SWKILLFGVI NLICTGFLLM WCSSTNSIAL 

TAYTYLT I FD LFSLMTCLIS YWVTLRKPSP VYSFGFERLE VLAVFASTVL AQLGALFILK 

ESAERFLEQP EIHTGRLLVG TFVALCFNLF TMLSIRNKPF AYVSEAASTS WLQEHVADLS 

RSLCGIIPGL SSIFLPRMNP FVLIDLAGAF ALCITYMLIE INNYFAVDTA SAIAIALMTF 

GTMYPMSVYS GKVLLQTTPP HVIGQLDKLI REVSTLDGVL EVRNEHFWTL GFGSLAGSVH 

VRIRRDANEQ MVLAHVTNRL YTLVSTLTVQ IFKDDWIRPA LLSGPVAANV LNFSDHHVIP 

MPLLKGTDDL NPVTSTPAKP SSPPPEFSFN TPGKNVNPVI LLNTQTRPYG FGLNHGHTPY 

SSMLNQGLGV PGIGATQGLR TGFTNIPSRY GTNNRIGQPR P 



Seq ID NO: 484 DNA sequence 

Nucleic Acid Accession #: FGENESH predicted 
Coding sequence: 1..900 

1 11 21 31 41 51 

I 1 I I I I 

ATGCCGCCGC GGGAGCTGAG CGAGGCCGAG CCGCCCCCGC TCCGGGCCCC GACCCCTCCC 

CCGCGGCGGC GTAGCGCGCC CCCAGAGCTG GGCATCAAGT GCGTGCTGGT GGGCGACGGC 

GCCGTGGGCA AGAGCAGCCT CAT CGTCAGC TACACCTGCA ATGGGTACCC CGCGCGCTAC 

CGGCCCACTG CGCTGGACAC CTTCTCTGGT ACGTACGTTC AATCGCCCGT GCGGCCGCGT 

GGCTGCGGCG GGGCTGTGCA CCGGGGAGCT GGGGCGGGCG TCTCGGCGGG AGGGCGCAGA 

GGACCCCGGG GAGGAGACTG GAGCAGGCCC CGAGGTGGCG CTGGTGCGGC CCAGGACGCT 

CTTCCTAACT CAGGCTCTCC CCGCCCCGCC CCTGCAGTGC AAGTCCTGGT GGATGGAGCT 

CCGGTGCGCA TTGAGCTCTG GGACACAGCG GGACAGGAGG ATTTTGACCG ACTTCGTTCC 

CTTTGCTACC CGGATACCGA TGTCTTCCTG GCGTGCTTCA GCGTGGTGCA GCCCAGCTCC 

TTTCAAAACA TCACAGAGAA ATGGCTGCCC GAGATCCGCA CGCACAACCC CCAGGCGCCT 

GTGCTGCTGG TGGGCACCCA GGCCGACCTG AGGGACGATG T CAACGT AC T AATTCAGCTG 



371 



WO 02/086443 

GACCAGGGGG GCCGGGAGGG CCCCGTGCCC CAACCCCAGG CTCAGGGTCT GGCCGAGAAG 720 

ATCCGAGCCT GCTGCTACCT TGAGTGCTCA GCCTTGACGC AGAAGAACTT GAAGGAAGTA 7 80 

TTTGACTCGG CTATTCTCAG TGCCATTGAG CACAAAGCCC GGCTGGAGAA GAAACTGAAT 840 

GCCAAAGGTG TGCGCACCCT CTCCCGCTGC CGCTGGAAGA AGTTCTTCTG CTTCGTTTGA 



PCT/US02/12476 



Seq ID NO: 485 Protein sequence 
Protein Accession #: FGENESH predicted 



10 



15 



MPPRELSEAE 
RPTALDTFSG 
LPNSGSPRPA 
FQNITEKWLP 
IRACCYLECS 



11 
I 

PPPLRAPTPP 
TYVQSPVRPR 
PAVQVLVDGA 
EIRTHNPQAP 
ALTQKNLKEV 



21 
I 

PRRRSAPPEL 
GCGGAVHRGA 
PVRIELWDTA 
VLLVGTQADL 
FDSAILSAIE 



31 
I 

GIKCVLVGDG 
GAGVSAGGRR 
GQEDFDRLRS 
RDDVNVLIQL 
HKARLEKKLN 



41 



51 



AVGKSSLIVS 


YTCNGYPARY 


60 


GPRGGDWSRP 


RGGAGAAQDA 


120 


LCYPDTDVFL 


ACFSWQPSS 


180 


DQGGREGPVP 


QPQAQGLAEK 


240 


AKGVRTLSRC 


RWKKFFCFV 





20 



Seq ID NO: 486 DNA sequence 

Nucleic Acid Accession #: XM_063832.2 

Coding sequence: 1..711 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



ATGCCGCCGC 
CCGCGGCGGC 
GCCGTGGGCA 
CGGCCCACTG 
ATTGAGCTCT 
CCGGATACCG 
ATCACAGAGA 
GTGGGCACCC 
GGCCGGGAGG 
TGCTGCTACC 
GCTATTCTCA 
GTGCGCACCC 



11 
] 

GGGAG CTGAG 
GTAGCGCGCC 
AGAGCAGCCT 
CGCTGGACAC 
GGGACACAGC 
ATGTCTTCCT 
AATGGCTGCC 
AGGCCGACCT 
GCCCCGTGCC 
TTGAGTGCTC 
GTGCCATTGA 
TCTCCCGCTG 



21 
I 

CGAGG CCGAG 
CCCAGAGCTG 
CATCGTCAGC 
CTTCTCTGTG 
GGGACAGGAG 
GGCGTGCTTC 
CGAGATCCGC 
GAGGGACGAT 
CCAACCCCAG 
AGCCTTGACG 
GCACAAAGCC 
CCGCTGGAAG 



31 

I 

CCGCCCCCGC 
GGCAT CAAGT 
TACACCTGCA 
CAAGT CCTGG 
GATTTTGACC 
AGCGTGGTGC 
ACGCACAACC 
GTCAACGTAC 
GCTCAGGGTC 
CAGAAGAACT 
CGGCTGGAGA 
AAGTTCTTCT 



41 



51 



TCCGGGCCCC 
GCGTGCTGGT 
ATGGGTACCC 
TGGATGGAGC 
GACTTCGTTC 
AGCCCAGCTC 
CCCAGGCGCC 
TAATTCAGCT 
TGGCCGAGAA 
TGAAGGAAGT 
AGAAACTGAA 
GCTTCGTTTG 



GACCCCTCCC 60 

GGGCGACGGC 120 

CGCGCGCTAC 180 

TCCGGTGCGC 240 

CCTTTGCTAC 300 

CTTTCAAAAC 360 

TGTGCTGCTG 420 

GGACCAGGGG 480 

GATCCGAGCC 540 

ATTTGACTCG 600 

TGCCAAAGGT 660 
A 



Seq ID NO: 487 Protein sequence 
Protein Accession #: XP 063832.1 



11 



21 



31 



41 



51 



1 
I 

MPPRELSEAE PPPLRAPTPP PRRRSAPPEL GIKCVLVGDG AVGKSSLIVS YTCNGYPARY 
RPTALDTFSV QVLVDGAPVR IELWDTAGQE DFDRLRSLCY PDTDVFLACF SWQPSSFQN 
ITEKWLPEIR THNPQAPVLL VGTQADLRDD VNVLIQLDQG GREGPVPQPQ AQGLAEKIRA 
CCYLECSALT QKNLKEVFDS AILSAIEHKA RLEKKLNAKG VRTLSRCRWK KFFCFV 

Seq ID NO: 488 DNA sequence 

Nucleic Acid Accession #: NM__0143 98.1 

Coding sequence: 64.. 13 14 



GGCACCGATT 
ACCATGCCCC 
CACGATGGCA 
ACTGCAGCAG 
CCTCACCAAA 
ACAGTAAAAA 
ATTACCTACA 
GTTACTGAAG 
CCACCAGCTC 
ACTCAACCCA 
ACAACCGGTC 
AATACCACCC 
CCATCGTCAG 
GCAGAGATGG 
TACTTCAACA 
AACCTTCTGT 
TCATATTATA 
CAAGGAATCA 
GTGAGTGAAC 
CTTCAAGCCT 
TACACAATTG 
GGTGT CTAT A 
CCCGGGGGGA 
TTGGGAAATT 
AATGAAGTGA 
GTTTATTTTA 
GCCACTCAAA 
AGCCTTCAAA 
ATTTTATTTT 
GCTTTTACTA 
ACTCCTTTTC 
CAGGCTGGAG 
TGATTCTCCT 
GCTAATTTTT 
CTCTTGACCT 
AGCCATTGCG 



11 
I 

CGGGGCCTGC 
GGCAGCTCAG 
GTCAAATGAG 
CAACAGTACA 
CTTTAGCAGC 
TTCCAACAAC 
CCCTGGTCAC 
TTACAGTCGG 
ATACAGCTGG 
GTAACCAGAC 
AGAAGCCTGA 
GCACAGCTGC 
TCAAGACTGG 
GGATACAGCT 
TCGACCCCAA 
TGAATTTTCA 
TCAGTGAAGT 
AACATGCGGT 
AGAGCCT CCA 
TTGATTTTGA 
TGCTTCCTGT 
AAATCCGCCT 
AT G AAAATAA 
CCCTCAGAGT 
GTCATGTGTG 
TGAAAGATAT 
GTCAACATTT 
TTATAAACCA 
ACCCTTGATC 
TCTGTGTTTT 
CACTTTAAAT 
TACAGTGGCA 
GCTTCAGCTT 
GTATTTTTAT 
CAGGTGATCC 
CCCGGCCTTA 



21 

I 

CCGGACTTCG 
CGCGGCGGCC 
AGCAAAAGCA 
GGACATAAAA 
AAGATTCATG 
TACCCCAGCA 
AACCCAGGCC 
CCCTAGCTTA 
AACCAGTTCA 
CACCCTTCCA 
TCAACCCACC 
ACCTGCCTCC 
AATTTAT CAG 
GATTGTT CAA 
CGCAACGCAA 
GGGCGGATTT 
GGGAGCCTAT 
GGTGATGTTC 
GTTGTCAGCC 
AGATGACCAC 
GATTGGGGCC 
AAGGTGTCAA 
TGGAATTTAG 
GTGGGTCCTT 
ATTTAAGTTC 
AGTGAGCTGT 
GAGATATGTT 
AGGGTCAATT 
TTAACAAAGC 
ATGGTTTCAT 
TTGTTTTTGT 
CGATCTCGGC 
CCCGAGTAGC 
TATAGACGGG 
ACCCACCTCA 
AATGTTTTTT 



31 
I 

CCGCACGCTG 
GCGCTCTTCG 
TTTCCAGAAA 
AAACCTGTCC 
GATGGTCATA 
ACTACAAAAA 
ACACCCAACA 
GCCCCTTATT 
TCAACCGTCA 
GCAACTTTAT 
CATGCCCCAG 
ACGGTTCCTG 
GTTCTAAACG 
GACAAGGAGT 
GCCTCTGGGA 
GTGAATCTCA 
TTGACCGTCT 
CAGACAGCAG 
CACCTGCAGG 
TTTGGAAATG 
ATCGTGGTTG 
TCATCTGGAT 
AGAACTCTTT 
CAAACAATGT 
AGGCAGCACA 
TTATTTTCTA 
GAATTAACAT 
GTAACTAATA 
CTTTGCTTTG 
GTAACATACA 
TTTTTGAGAC 
TTATGGCAAC 
TGGGATTACA 
TTT CACCATG 
GCCTCCCAAA 
TTAATCATCA 



41 
I 

CAGAACCTCG 
CGTCCCTGGC 
CCAGAGATTA 
AGCAACCAGC 
TCACCTTTCA 
ACACTGCAAC 
ACTCACACAC 
CACTGCCACC 
GCCACACAAC 
CGATAGCACT 
GAACAACGGC 
GGCCCACCCT 
GAAGCAGACT 
CGGTTTTTTC 
ACTGTGGCAC 
CATTTACCAA 
CAGATCCAGA 
TCGGGCATTC 
TGAAAACAAC 
TGGATGAGTG 
GTCTCTGCCT 
ACCAGAGAAT 
CATCCCTTCC 
AAACCACCAT 
TCAATTTCTA 
GTTTCCTTTA 
AATATATGTA 
CTACTGTGTG 
TTATCAAATG 
TATTCCTGGT 
GGAGTTTCAC 
CTCCGCCTCC 
GGCACACACT 
TTGGCCAGAC 
GTGCTGGGAT 
AAAAGAACAA 



51 
I 

CCCAGCGCCC 
CGTAATTTTG 
TTCTCAACCT 
TAAGCAAGCA 
AACAGCGGCC 
CACCAGCCCA 
AGCTCCTCCA 
CACCATCACC 
TGGGAACACC 
GCACAAAAGC 
AGCTGCCCAC 
TGCACCTCAG 
CTGTATAAAA 
ACCTCGGAGA 
CCGAAAATCC 
GGATGAAGAA 
GACAGTTTAC 
CTTCAAGTGC 
CGATGTCCAA 
CTCGTCTGAC 
TATGGGTATG 
CTAATTGTTG 
AGGATGGATG 
CTTCTATTCA 
AATACTTTTT 
GAATATTTTA 
AAGTAGAATA 
TGCATTGAAG 
GACTTTCAGT 
GTAG CACTT A 
TCTTGTCACC 
CGGGTTCAAG 
ACCACGCCTG 
TGGTCTTGAA 
TACAGGCATG 
CATATCT CAG 



60 
120 
180 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 



372 



10 



15 



WO 02/086443 

GTTGTCTAAG TGTTTTTATG 
CTTGATGACT CCTGCTCCAG 
CTAAACAATA AGCAAGAGAC 
TAGGCTAAGC ACTTTATCTA 
ACTGAGACTT AAGGGAACTG 
GAGCTTGAAT TCATGTTGGT 
CCTACAAGAA CAATGACACC 
TCACCTTACA GGGAAATGGG 
AGCTTTGCAG ATAACAAAAT 
TGAGGGGCTT TGTAAAACAT 
GTAAAGATGA AGGCAT CAAA 
ACTTCGCTAA CCAACTGTTC 
TTCTGCACTT CATATCCATA 
GAATTTT AT T TCTGCTGTTT 
AGAAAAGTCC ACATAACCCT 
CCATGTTGAC TTTCCTCATG 
TAGTCTTAAT AAAACATTGA 



TAAAACCAAC 
AATTGCTAGA 
AATAATAATG 
TATCTCATTT 
AATCACTTAA 
CTGACATCAA 
ACACTCTGCC 
TTTATCCAGG 
AGCCTATCCT 
TAGTCAGTTG 
TAAACTCAAA 
TTTCTTGAGT 
TTTCCTATTG 
TTTTTGCTGC 
AGAATTCTTA 
TGTTTCCTTA 
ATTGTAGTAA 



AAAAAGAACA 
CTAAGAATTA 
GCCCTTAATT 
CATTCTCACA 
ATGTCACCTG 
GGTCTTTGGT 
TGAAGG CTCA 
ATCATGAGAC 
TAATAAATCC 
CTCATTTTTA 
GTATTTTTAA 
GTATAGCCCC 
TTCACTTTAT 
TAAAGAAAGG 
GTCAAGGAAT 
TGACTCAGTA 
AGGTTTTTGC 



AATCAGCTTA 
GGTGGCTACA 
AT T AACAAAG 
ACTTATAAGT 
GCTAACTGAT 
CTTCTCCCTA 
CACCTCATAC 
ATTAGGGTAG 
TCCACTCTCT 
TGGGATTGCT 
ATTTTTTTGA 
ATCTTGTGGT 
TCTGTAGAGC 
AACTAAGTCA 
AATTCAAGTC 
AGTTGGCAAG 
AATAAAAACT 



TATTTTTTAT 2220 

GATGGTAGAA 2280 

TGCCAGAGTC 2340 

GAATGAGTAA 240 0 

GGCAGAGCCA 2460 

CACCAAGTTA 252 0 

CAGCATACGC 2580 

ATGAAAGGAG 2640 

GGAAGGAG AC 2 700 

TAGCTGGGCT 2760 

T AAT AGAGAA 282 0 

AACTTGCTGC 2 880 

AGCCTGCCAA 2940 

GGATGTTAAC 3000 

AGCCTAGAGA 3060 

GTCCTGACTT 3120 
TACTTTGG 



PCT/US02/12476 



Seq ID NO: 489 Protein sequence 
20 Protein Accession #: NP 055213.1 



25 



30 



I 

MPRQLSAAAA 
HQTLAARFMD 
TEVTVGPSLA 
TGQKPDQPTH 
EMGIQLIVQD 
YYISEVGAYL 
QAFDFEDDHF 



11 
I 

LFASLAVILH 
GHITFQTAAT 
PYSLPPTITP 
APGTTAAAHN 
KESVFSPRRY 
TVSDPETVYQ 
GNVDECSSDY 



21 
I 

DGSQMRAKAF 
VKIPTTTPAT 
PAHTAGTSSS 
TTRTAAPAST 
FNIDPNATQA 
G I KHAWMFQ 
TIVLPVIGAI 



31 

I 

PETRDYSQPT 
TKNTATTSPI 
TVSHTTGNTT 
VPGPTLAPQP 
SGNCGTRKSN 
TAVGHSFKCV 
WGLCLMGMG 



41 

I 

AAATVQD I KK 
TYTLVTTQAT 
QPSNQTTLPA 
SSVKTGIYQV 
LLLNFQGGFV 
SEQSLQLSAH 
VYKIRLRCQS 



51 
I 

PVQQPAKQAP 60 

PNNSHTAPPV 12 0 

TLSIALHKST 180 

LNGSRLCIKA 240 

NLTFTKDEES 300 

LQVKTTDVQL 360 
SGYQRI 



35 



Seq ID NO: 490 DNA sequence 

Nucleic Acid Accession #: NM_005409.3 

Coding sequence: 94.. 3 78 



40 



45 



50 



55 



11 



60 



TTCCTTTCAT 
CAACAGCACC 
TTGGCTGTGA 
TGTCTTTGCA 
ATAATGTACC 
AAAGGACAAC 
GAAAGAAAGA 
AACCTAGAAC 
AGACTTTTCT 
GGGTGAAAGG 
CTGCCCAAAG 
GGTTACCATC 
GCATTTCTAG 
GAGAACATTT 
CTGTGGTTAC 
CATCTATGTG 
CCAAATATCA 
TTTATAACCA 
TGGGATACTG 
GATGTTTTTC 
TGTACTTTTT 
TACAAAATGT 
AATCACTTTT 
TTGTTCATGC 
GTCATTTTTT 



GTTCAGCATT 
AGCAGCAACA 
TATTGTGTGC 
TAGGCCCTGG 
CAAGTAACAA 
GATGCCTAAA 
ATTTTTAAAA 
AAGTTTAACT 
ATGGTTTTGT 
ACCAAAAACA 
GAGTCCAGCA 
GGAGTTTACA 
GCTAGAGAAC 
CTGTCTCTAG 
AGTGGAGACA 
TCGTAAAGCA 
TGTAGCACAT 
ATTCATTAAA 
GCAACAGTGC 
AACTTTTATT 
GTTTTGATCC 
TTTTGTCTAC 
ACTTTTTGTA 
CTATATACTG 
TCTCTAATAA 



21 
1 

TCTACTCCTT 
GCAAAAAACA 
TACAGTTGTT 
GGTAAAAGCA 
CTGTGACAAA 
TCCCAAATCG 
ATATCAAAAC 
GTGACTACTG 
GACTTTCAAC 
GAAATACAGT 
ATTAAATGGA 
AAGTGCTTT C 
CTTCTAGATT 
AAGTTATCTG 
TTGACATTAT 
TTCCTCAAAC 
CAATATGTAG 
TGTAATTCAT 
ACATATTTCA 
CATTGAGATG 
GTTTGTATAA 
CAAAGAAAAA 
ATTCTGTCTC 
TAAAATTTAG 
ACTACCACAA 



31 

I 

CCAAGAAGAG 
AACATGAGTG 
CAAGGCTTCC 
GTGAAAGTGG 
ATAGAAGTGA 
AAGCAAGCAA 
AT ATGAAGT C 
AAATGA CAAG 
TTTTGTACAG 
CTTCCTGAAT 
TTTCTAGGAA 
ACGTTCTTAC 
TGATGCTTAC 
TCTGTATTGA 
TACTGGAGTC 
ATTTTTTCAT 
GGAAACATTC 
AAAATGTACT 
TAACCAAATT 
TTTTGAAGCA 
ATGATAGCAA 
TGTTGAAAAA 
TTAGAAAAAT 
GTATACTCAA 
CCTTTCTTTT 



41 

I 

CAGCAAAGCT 
TG AAGGG CAT 
CCATGTTCAA 
CAGATATTGA 
TTATTACCCT 
GGCTTATAAT 
CTGGAAAAGG 
AATTCTACAG 
TTATGTGAAG 
GAATGACAAT 
AAGCTACCTT 
TTGTTGTATT 
AACTATTCTG 
TCTTTATGCT 
AAGCCCTTAT 
GCAAATACAC 
TTATGCATCA 
ATGAAAAAAA 
AGCAGCACCG 
ATTAGGATAT 
TATCTTGGAC 
TAAGCAAATG 
ACATAATCTA 
GACTAGTTTA 
TTAAAAAAAA 



51 
] 

GAAGTAGCAG 60 

G G CT AT AG C C 12 0 

AAGAGGACGC 180 

GAAAGCCTCC 240 

GAAAGAAAAT 300 

CAAAAAAGTT 360 

GCAT CTG AAA 420 

TAGGAAACTG 480 

GATGAAAGGT 540 

CAGAATTCCA 600 

AAGAAAGGCT 660 

ATACATTCAT 720 

TTGTGACTAT 780 

ATATTACTAT 840 

AAGTCAAAAG 90 0 

ACTTCTTTCC 960 

TTTGGTTTGT 1020 

TTATACGCTA 1080 

GTCTTAATTT 1140 

GTGTGTTTAC 1200 

ACATTTGAAA 1260 

TATACCTAGC 1320 

ATCAATTTCT 1380 

AAG AAT CAAA 1440 
AAA 



65 



70 



Seq ID NO: 491 Protein sequence 
Protein Accession #: NP_005400.1 

1 11 21 31 41 51 

I I I I I I 

MSVKGMAIAL AVILCATWQ GPPMPKRGRC LCIGPGVKAV KVADIEKASI MYPSNNCDKI 

EVIITIiKENK GQRCLNPKSK QARLIIKKVE RKNP 



60 



75 



80 



85 



Seq ID NO: 492 DNA sequence 

Nucleic Acid Accession #: NM_000577.1 

Coding sequence: 41.. 520 



GGCACGAGGG 
CCGACCCTCT 
GAAGACCTTC 
CAATTTAGAA 
CCATGGAGGG 
GGAGGCAGTT 
CATCCGCTCA 
CCTCTGCACA 
CGT CATGGTC 
TCCCATTCTT 



11 
I 

GAAGACCTCC 
GGGAGAAAAT 
TAT CTGAGG A 
GAAAAGATAG 
AAGATGTGCC 
AACATCACTG 
GACAGTGGCC 
GCGATGGAAG 
ACCAAATTCT 
GCATGGCAAG 



21 

i 

TGTCCTATCA 
CCAG CAAG AT 
ACAACCAACT 
ATGTGGTACC 
TGTCCTGTGT 
ACCTGAGCGA 
CCACCACCAG 
CTGACCAGCC 
ACT TCCAGGA 
GACTGCAGGG 



31 

1 

GGCCCTCCCC 
GCAAGCCTTC 
AGTTGCCGGA 
CATTGAGCCT 
CAAGTCTGGT 
GAACAGAAAG 
TTTTGAGTCT 
CGTCAGCCTC 
GGACGAGTAG 
ACTGCCAGTC 



41 

1 

ATGGCTTTAG 
AGAATCTGGG 
TACTTGCAAG 
CATGCTCTGT 
GATGAGACCA 
CAGGACAAGC 
GCCGCCTGCC 
ACCAATATGC 
TACTGCCCAG 
CCCCTGCCCC 



51 
I 

AGACGATCTG 60 

ATGTTAACCA 120 

GACCAAATGT 180 

TCTTGGGAAT -240 

GACTCCAGCT 300 

GCTTCGCCTT 360 

CCGGTTGGTT 420 

CTGACGAAGG 480 

GCCTGCCTGT 540 

AGGGCTCCCG 60 0 



373 



10 



15 



20 



WO 02/086443 

GCTATGGGGG CACTGAGGAC 
CCTGGTCACA GGACTCTGCC 
GTCTTTCTAA TGTGTGAATC 
TCTGCATTCA GGATCAAACC 
CTTCCTCCCT CATTCCACCT 
ACCAAGTGGC TCCCACACCC 
TTTAAGGGTT TGTGGAAAAT 
GAAGGAGAGC CCTTCATTTG 
ATTCCTGCAT TTGTGAAATG 
TTTTTTTGTG ATGTCCCAAC 
ATTTTTTTTT TCCTTTTAAA 
CCCAGCCTCC AAGCTCCATC 
TCCTATCAGA AGTTTCTCAG 
TCTTCCTCTG CTGAAGGAAT 
ACTTGTATGA AAGATGG CTG 
GAGCAGGAAA CATGACTCGT 
CTCTTGGCAG GTACTCAGCG 
CTGTGACTTC AGCTCTGTTT 
AAAAAAAAAA AAAAAAAAAA 



PCT/US02/12476 



CAGCCATTGA 
TCCTCTTCAA 
AGAGCACAGC 
CCGACCACCT 
TCCCATGCCC 
TGTTTTACAA 
GAAAATTAGG 
GAGATTATGT 
ATGGTGAAAG 
TTGTAAAAAT 
ACACTTCCAT 
TCCACTCCAG 
CTCCCAAGGC 
AAATTGCTCC 
TGCCTCTGCC 
ATATGTCTCA 
AATGAATGCT 
TACAATAAAA 
AAAAAAAAAA 



GGGGTGGACC 
CTGACCAGCC 
AGCCCCTGCA 
GCCCAACCTG 
TGGATCCATC 
AAAAGAAAAG 
ATTTCATGAT 
TCTTTCGGGG 
TAAGTGGTAG 
TAAAAGTTAT 
AAT CTGG ACT 
ATTTTTTACA 
TCTGAGCAAA 
TTGACATTGT 
TGTCTCCCCC 
GGTCCCTGCA 
GTATATGTTG 
TCTTGAAAAT 
AAAAAA 



CTCAGAAGGC 
TCCATGCTGC 
CAAAGCCCTT 
CTCTCCTCTT 
AGGCCACTTG 
ACCAGTCCAT 

t t i' t i* ^ 1 Tr 

AGAGGCTGAG 
CTTTTCCCTT 
GGTACTATGT 
CCTCTGTCCA 
GCTGCCTGCA 
TGTGGCTCCT 
AGAGCTTCTG 
ACCAGGCTGG 
GGGCCAAGCA 
GGTGCAAAGT 
GCCTAAAAAA 



GTCACAACAA 660 

CTCCAGAATG 720 

CCATGTCGCC 780 

GCCACTGCCT 840 

ATGACCCCCA 900 

GAGGGAGGTT 960 

CAGTCCCCGT 102 0 

GACTTAAAAT 1080 

CTTTTTCTTC 1140 

TAGCCCCATA 12 0 0 

GGCACTGCTG 1260 

GTACTTTACC 132 0 

GGGGGTTCTT 13 80 

GCACTTGGAG 1440 

GAGCTCTGCA 1500 

CCTAGCCTCG 1560 

TCCCTACTTC 1620 

AAAAAAAAAA 1680 



Seq ID NO : 4 93 Protein sequence 
Protein Accession #: NP 000568.1 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



1 11 21 31 41 SI 

I I I I I I . 

MALETICRPS GRKSSKMQAF RIWDVNQKTF YLRNNQLVAG YLQGPNVNLE EKIDWPIEP 

HALFLGIHGG KMCLSCVKSG DETRLQLEAV NITDLSENRK QDKRFAFIRS DSGPTTSFES 

AACPGWFLCT AMEADQPVSL TNMPD EGVMV TKFYFQEDE 

Seq ID NO: 494 DNA sequence 

Nucleic Acid Accession #: NM_002081.1 

Coding sequence: 222.. 1898 



60 
120 



85 



GGCTGCCCGA 
GGCTTTTGTT 
CGGGACCTTG 
AGAGGCGCGG 
GCTGGTGGCT 
GCAAGAGCCG 
GCGACGTGCC 
CCTGCTGCAC 
CCGCGCTCCG 
TCGATGACCA 
CCGGCGCCTT 
AGCTGCGCCT 
GGGCCCGCCT 
ACTACCTGGA 
GAGAGCTGCG 
TGGGCGTGGC 
CGAGAGCTGT 
CCTGCCCTGA 
ACGCCGAGTG 
CATCGGGTGT 
CCCTCCAGGA 
AGGTCAACCC 
GGGAGAGGCC 
GCGACGT CCA 
TGAGCACTGC 
AGGTCATGGG 
CCAAGCCGGA 
TGCGCAGCGC 
GCTCGGGCAG 
GCTCCAGCTC 
AGAAGACCTC 
TCCTGGCCCT 
GAGGCCAAGG 
TGGAGAGGCC 
GTCCCAGCCC 
CAGGTCAGCT 
TCCGGCTGCC 
CTACAGAGGA 
CGCCTCCTCC 
CCTCCAGAGA 
TCTGAGATGA 
CTGCGCCCTT 
GGAGTCTGAG 
GGGGCCACTG 
GGAGGCAGCG 
GCCTTGCTGG 
CCTGCTCCCA 
CAGGGCTCAG 
CCCCGCACTG 
GCACGGGGAC 
TGTCCTTGTT 
CACCTTGGAC 



11 
I 

GCGAGCGTTC 
GTCTCCGCCT 
GCTCTGCCCT 
GCGGGTGGCC 
GCTATGTGCG 
GAGCTGCGGC 
CCAGGCGGAG 
CAGCGAGATG 
GGACAGCAGC 
CTTCCAGCAC 
CGGAGAGCTG 
GTACTACCGC 
GCTCGAGCGC 
CTGCCTGGGC 
CCTGCGGGCC 
CAGCGACGTG 
CATGAAGCTG 
CTATTGCCGA 
GAGGAACCTC 
GGAGAGTGTC 
CAACAGGGAC 
CCAGGGCCCT 
ACCTTCAGGC 
GGACTTCTGG 
CAGTGATGAC 
TGACGGCCTG 
CATGACCATC 
CTACAACGGC 
CGGTGATGGC 
CCGGACGCCC 
GGCTGCCAGC 
TACAGTAGCC 
ACTGACTTTG 
TGGGGTGGGA 
CAGGCCTGGC 
GGGAGCCAGT 
TAGCCCTCCC 
GGCCTCAAAG 
CACTGGGACT 
AGCCCCGCAC 
TGCATGATGC 
GAGGGGCCCC 
GACTGTCCTC 
ACCCACCTGC 
TGGGCTCTGC 
GGTCCAGGGC 
TCCTCACCCA 
AGTGACCCTC 
CACACGGGAA 
CTGGATAGTT 
CATGGAGAGC 
CCTGGTGACC 



21 
I 

GGACCTCGCA 
CCTCGGCCGC 
TCGCGGGCGG 
GGGGGCGCCG 
GCCGCAGCGC 
GAGGTCCGCC 
ATCTCGGGTG 
GAGGAGAACC 
CGCGTCCTGC 
CTGCTGAACG 
TACACGCAGA 
GGTGCCAACC 
CTCTTCAAGC 
AAGCAGGCCG 
ACCCGTGCCT 
GTCCGGAAAG 
GTCTACTGTG 
AATGTGCTCA 
CTGGACTCCA 
ATCGGCAGCG 
ACGCTCACGG 
GGGCCTGAGG 
ACGCTGGAGA 
ATCAGCCTCC 
CGCTGCTGGA 
GCCAACCAGA 
CGGCAGCAGA 
AACGACGTGG 
TGTCTGGATG 
TTGACCCATG 
TGCCCCCAGC 
AGGCCCCGGT 
CCAAAAATAC 
CAGGGAGGGC 
CTCGCCTGCC 
GTGCCCAAAA 
CCCAGCTCCC 
CAACCCGCTG 
CCCAGCAGAG 
GGGCTGTCTG 
CCTCCCCTCA 
AGCGTCTGCA 
CCACAGACCC 
GCTTCTGCTG 
CAATGTGGGC 
TGTTGGAGGA 
GATCAGGAAC 
GGCTGTCACC 
TGCCTAGGTC 
AAGGGCTTTT 
TGTTCGCTCC 
TCCTGTCACT 



31 



41 



CCCCGCGCGC 
CGCCGCCTCT 
GAACTGCGCA 
CCGGCCCCGC 
TGGTCGCCTG 
AGATCTACGG 
AGCACCTGCG 
TGGCCAACCG 
AGGCCATGCT 
ACTCGGAGCG 
ACGCGAGGGC 
TGCACCTGGA 
AGCTGCACCC 
AGGCGCTGCG 
TCGTGGCTGC 
TGGCTCAGGT 
CTCACTGCCT 
AGGGCTGCCT 
TGGT G C T CAT 
TGCACACGTG 
CCAAGGTCAT 
AGAAGCGGCG 
AGCTGGTCTC 
CAGGGACACT 
ACGGGATGGC 
TCAACAACCC 
TCATGCAGCT 
ACTT CCAGGA 
ACCTCTGCGG 
CCCTCCCAGG 
CCCCGACCTT 
GGCGGTAACT 
AACACAGACG 
CGGCGGCTCT 
TTTCTGCCTT 
GCCATGTATT 
TGCACCGCCG 
GAGCCCACAG 
CCCACCAGCC 
GGTGTCCGCC 
GCGCAGGCTG 
GGGTGACGCC 
TGCAGTGAGG 
GAG GAGGGGA 
TGCCCCTCGC 
CCCCGAGGGC 
CAGGGCCTCC 
TGCTCACAGG 
CCTTCCCGAC 
CCAAACATGC 
TCCCAGATGG 
CACTGAGGCC 



CCCGCGCCGC 
GGACCGCGAG 
GGACCCGGCC 
CATGGAGCTC 
CGCCCGCGGG 
AGCCAAGGGC 
GAT CTGTCCC 
CAGCCATGCC 
TGCCACCCAG 
GACGCTGCAG 
CTTCCGGGAC 
GGAGACGCTG 
CCAGCTGCTG 
GCCCTTCGGG 
TCGCTCCTTT 
CCCCCTGGGC 
GGGAGTCCCC 
TGCCAACCAG 
CACCGACAAG 
GCTGGCGGAG 
CCAGGGCTGC 
CCGGGGCAAG 
TGAAGCCAAG 
GTGCAGTGAG 
CAGAGGCCGG 
CGAGGTGGAG 
GAAGATCATG 
CGCCAGTGAC 
CCGGAAGGTC 
CCTGTCAGAG 
CCTCCTGCCC 
GCCCCAAGGC 
ATATTTAATT 
GAGCAGGGGC 
TTAATTTTGT 
TCAGGGACCT 
CAGAAGCAGC 
CGAGCCTGTG 
AGCCCTGGCC 
AT CCAGGGTC 
CAGAGCCCGG 
TGAGACAGCA 
GGCCCTCCAT 
AGCTGGGCCC 
ACACAGGGCT 
TGAGGAGCAG 
CTGTTCACGG 
GATGCTGGTG 
CCAGCCAGCT 
ATCCATTTAC 
CTTCGGAGGC 
AT CAGGGCCC 



51 
I 

CGCCGCCGCC 
CCGCGCGCGC 
AGGATCCGAG 
CGGGCCCGAG 
GACCCGGCCA 
TTCAGCCTGA 
CAGGGCTACA 
GAGCTGGAGA 
CTGCGCAGCT 
GCCACCTTCC 
CTGTACTCAG 
GCCGAGTTCT 
CTGCCTGATG 
GAGGCCCCGA 
GTGCAGGGCC 
CCGGAGTGCT 
GGCGCCAGGC 
GCCGACCTGG 
TTCTGGGGTA 
GCCATCAACG 
GGGAACCCCA 
CTGGCCCCGC 
GCCCAGCTCC 
AAGATGGCCC 
TACCTCCCCG 
GTGGACATCA 
ACCAACCGGC 
GACGGCAGCG 
AGCAGGAAGA 
CAGGAAGGAC 
CTCCTCCTCT 
CCCAGGGACA 
CACCTCAGCC 
AGGCGCAGAG 
ATGAGGTCCT 
CAGGGGCACC 
CCCTCGAGGC 
CCTTCCTCCC 
CACCCCCCAG 
TGGCAGAGCC 
CCCCACCTCC 
CCACTGCTGA 
GCGCAGATGA 
AAAGGCCCAG 
CACAGGGCAG 
CCAGGACCCG 
TGACACAGGT 
GCTGGTGAGA 
GCACTGCAGG 
TGACACTTCC 
CCGCAGGGCC 
TGCCCCAGGC 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
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GTGGACGGGC CCTCCTTCCC TCCTGTGCCC CAGCTGCCAG GTGGCCCTGG GGAGGGGTGG 3180 

TGTGGTGTTG GGAAGGGGTC CTGCAGGGGG AGGAGGACTT GGAGGGTCTG GGGGCAGCTG 3240 

TCCTGAACCG ACTGACCCTG AGGAGGCCGC TTAGTGCTGC TTTGCTTTTC ATCACCGTCC 3300 

CGCACAGTGG ACGGAGGTCC CCGGTTGCTG GTCAGGTCCC CATGGCTTGT TCTCTGGAAC 33 60 

5 CTGACTTTAG ATGTTTTGGG ATCAGGAGCC CCCAACACAG GCAAGTCCAC CCCATAATAA 342 0 

CCCTGCCAGT GCCAGGGTGG GCTGGGGACT CTGGCACAGT GATGCCGGGC GCCAGGACAG 3480 

CAGCACTCCC GCTGCACACA GACGGCCTAG GGGTGGCGCT CAGACCCCAC CCTACGCTCA 3540 

TCTCTGGAAG GGGCAGCCCT GAGTGGTCAC TGGTCAGGGC AGTGGCCAAG CCTGCTGTGT 360 0 

CCTTCCTCCA CAAGGTCCCC CCACCGCTCA GTGTCAGCGG GTGACGTGTG TTCTTTTGAG 3 660 
10 TCCTTGTATG AATAAAAGGC TGGAAACCTA AA 

Seg ID NO: 4 95 Protein sequence 
Protein Accession #: NP_0 02 072.1 

15 1 11 21 31 41 51 

I I 1 I I I 

MELRARGWWL LCAAAALVAC ARGDPASKSR SCGEVRQIYG AKGFSLSDVP QAEISGEHLR 60 

ICPQGYTCCT SEMEENLANR SHAELETALR DSSRVLQAML ATQLRSFDDH FQHLLNDSER 12 0 

TLQATFPGAF GELYTQNARA FRDLYSELRL YYRGANLHLE ETLAEFWARL LERLFKQLHP 18 0 

20 QLLLPDDYLD CLGKQAEALR PFGEAPRELR LRATRAFVAA RSFVQGLGVA SDWRKVAQV 240 

PLGPECSRAV MKLVYCAHCL GVPGARPCPD YCRNVLKGCL ANQADLDAEW RNLLDSMVLI 3 00 

TDKFWGTSGV ESVIGSVHTW LAEAINALQD NRDTLTAKVI QGCGNPKVNP QGPGPEEKRR 3 60 

RGKLAPRERP PSGTLEKLVS EAKAQLRDVQ DFWISLPGTL CSEKMALSTA SDDRCWNGMA 420 

RGRYLPEVMG DGLANQ INNP EVEVD I TKPD MTIRQQIMQL KIMTNRLRSA YNGNDVDFQD 480 
25 ASDDGSGSGS 

Seq ID NO: 496 DNA sequence 

Nucleic Acid Accession ft: NM_001650.2 

Coding sequence: 40.1011 

1 11 21 31 41 51 

l l l l l I 

GGGGCAGGCA ATGAGAGCTG CACTCTGGCT GGGGAAGGCA T G AGT G AC AG ACCCACAGCA 60 

AGGCGGTGGG GTAAGTGTGG ACCTTTGTGT ACCAGAGAGA A CAT C ATGGT GGCTTTCAAA 120 

35 GGGGTCTGGA CTCAAGCTTT CTGGAAAGCA GTCACAGCGG AATTTCTGGC CATGCTTATT 180 

TTTGTTCTCC TCAGCCTGGG ATCCACCATC AACTGGGGTG GAACAGAAAA GCCTTTACCG 240 

GTCGACATGG TTCTCATCTC CCTTTGCTTT GGACTCAGCA TTG CAACCAT GGTGCAGTGC 300 

TTTGGCCATA TCAGCGGTGG CCACATCAAC CCTGCAGTGA CTGTGGCCAT GGTGTGCACC 360 

AGGAAGATCA GCATCGCCAA GTCTGTCTTC TACATCGCAG CCCAGTGCCT GGGGGCCATC 420 

40 ATTGGAGCAG GAATCCTCTA TCTGGTCACA CCTCCCAGTG TGGTGGGAGG CCTGGGAGTC 480 

ACCATGGTTC ATGGAAATCT TACCGCTGGT CATGGTCTCC TGGTTGAGTT GATAATCACA 540 

TTTCAATTGG TGTTTACTAT CTTTGCCAGC TGTGATTCCA AACGGACTGA TGTCACTGGC 60 0 

TCAATAGCTT TAGCAATTGG ATTTTCTGTT GCAATTGGAC ATTTATTTGC AATCAATTAT 660 

ACTGGTGCCA GCATGAATCC CGCCCGATCC TTTGGACCTG CAGTTATCAT GGGAAATTGG 72 0 

45 GAAAACCATT GGATATATTG GGTTGGGCCC AT CAT AGGAG CTGTCCTCGC TGGTGGCCTT 780 

TATGAGTATG TCTTCTGTCC AGATGTTGAA TTCAAACGTC GTTTTAAAGA AGCCTTCAGC 840 

AAAGCTGCCC AGCAAACAAA AGGAAGCTAC ATGGAGGTGG AGGACAACAG GAGTCAGGTA 900 

GAGACGGATG ACCTGATTCT AAAACCTGGA GTGGTGCATG TGATTGACGT TGACCGGGGA 960 

GAGGAGAAGA AGGGGAAAGA CCAATCTGGA GAGGTATTGT CTTCAGTATG ACTAGAAGAT 1020 

50 CGCACTGAAA GCAGACAAGA CTCCTTAGAA CTGTCCT CAG ATTTCCTTCC ACCCATTAAG 1080 

GAAACAGATT TGTTATAAAT TAGAAATGTG CAGGTTTGTT GTTTCATGTC ATATTACTCA 1140 

GTCTAAACAA TAAATATTTC ATAATTTACA AAGGAGGAAC GGAAGAAACC TATTGTGAAT 1200 

TCCAAATCTA AAAAAAGAAA TATTTTTAAG ATGTTCTTAA GCAAATATAT ACCTATTTTA 1260 

TCTAGTTACC TTTCATTAAC AACCAATTTT AACCGTGTGT CAAGATTTGG TTAAGTCTTG 1320 

55 CCTGACAGAA CTCAAAGACA CGTCTAT CAG CTTATTCCTT CTCTACTGGA ATAT TGGTAT 1380 

AGTCAATTCT TATTTGAATA TTTATTCTAT TAAACTGAGT TTAACAATGG C 



60 



Seq ID NO: 497 Protein sequence 
Protein Accession #: NP 001641.1 



1 11 21 31 41 51 

I I I I i l 

MSDRPTARRW GKCGPLCTRE NIMVAFKGVW TQAFWKAVTA EFLAMLIFVL LSLGSTINWG 60 

GTEKPLPVDM VLISLCFGLS IATMVQCFGH ISGGHINPAV TVAMVCTRKI SIAKSVFYIA 12 0 

65 AQCLGAI IGA GILYLVTPPS WGGLGVTMV HGNLTAGHGL LVELI ITFQL VFTIFASCDS 180 

KRTDVTGSIA LAIGFSVAIG HLFAINYTGA SMNPARSFGP AVIMGNWENH WIYWVGPIIG 240 

AVLAGGLYEY VFCPDVEFKR RFKEAFSKAA QQTKGSYMEV EDNRSQVETD DLILKPGWH 300 
VIDVDRGEEK KGKDQSGEVL SSV 

70 Seq ID NO: 498 DNA sequence 

Nucleic Acid Accession ft: AB020684.1 
Coding sequence : 1 . . 1744 

1 11 21 31 41 51 

75 | | | | j I 

CCCCCTTGTC ATTAATACAT TAAAAAGATT CAATCTTTAC CCTGAGGTAA TTTTGGCCAG 60 

TTGGTACCGG ATTTATACCA AAATAATGGA CTTGATTGGT ATTCAAACCA AGATATGTTG 120 

GACGGTTACC AGAGGAGAAG GACTCAGTCC TATTGAAAGC TGTGAAGGAT TGGGAGATCC 180 

TGCTTGCTTT TATGTTGCTG TAATTTTTAT TTTAAATGGA CTAATGATGG CATTATTCTT 240 

80 CATATATGGC ACATATTTAA GTGGCAGCCG ATTAGGAGGC CTGGTTACAG TGTTGTGCTT 3 00 

CTTTTTCAAT CATGGAGAGT GTACCCGTGT AATGTGGACA CCACCTCTCC GTGAAAGCTT 360 

CTCATATCCA TTTCTTGTTC TTCAGATGTT GCTAGTGACT CATATTCTCA GGGCTACAAA 420 

ACTTTATAGA GGAAGCTTGA TTGCACTCTG CATTTCCAAT GTATTTTTCA TGCTTCCTTG 480 

GCAGTTTGCT CAGTTTGTAC TTCTTACTCA GAT T G CAT C A TTATTTGCAG TATATGTTGT 540 

85 CGGGTACATT GATATATGTA AATTACGGAA GATCATTTAT ATACACATGA TTTCTCTTGC 600 

ACTTTGTTTT GTTTTGATGT TTGGGAACTC AATGTTATTA ACTTCTTATT ATGCTTCTTC 660 

TTTGGTAATT ATTTGGGGTA TTCTGGCAAT GAAACCACAT TTCCTGAAAA TAAATGTATC 72 0 
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TGAACTTAGT TTATGGGTTA 
ATACTTGACA TCTAAAATTT 
ATCAAAATTC TTTAGT TATA 
TGACTTTATG GAAAAAGAGA 
TCTTGTAGTG TTTGTTGCTA 
TAAACAACAG ACACATGTAA 
ATTGCAATTG TTAGCATATA 
GACACCACAC ATGTGTGTTA 
CTTTTGCAAA GTACATCCTG 
AGGTTCAGCA AATCTGCAAA 
AGAAGAACTT ATAGAATGGA 
CATGCCCACG ATGGCAAGTG 
TTATGAAGAC GCAGGCTTGA 
AGCAGCCGAA GAAGTGAAGC 
AGAGTCATGG TGTGTAAGAA 
AGAAGAT CCT GCCAATGCTG 
ACCTCACTTC ACC ACT GT AT 
ATGACTGCTA CATGACCTGC 
GCTAAGTCAT GTGTTGTTCA 
AACGTTTTAT TTGGTCAATT 
CAATTGGTTA CTATTTCAAT 
TACTTGACTT TAATATTTGT 
GGGTTGTGAC AAGGATGACA 
TATAGTGTAA GAACTATTAA 
TGGACATTTC AGTGATTGTA 
ACAGTAGATG GGGCAGACAT 
CTTGTGCGCT TTTTGTTCTC 
CCAAACTCTT GGACCTTGTG 
GTGTCTCTTT CTCTCTCTCT 
AATAAGTACT GTTTACTCAT 
ATTAATGGTA ACTGTATTTT 
CTTTAAACCA CTTTAAAGTT 
ACAACCCCAA ATATAGTGCA 
TGGAACAGTA GACTGTAGTA 
TGACTAATTT TGCTGTCAAA 
CTTTTAAGAT TGCCTGTCTT 
TCTAAAAACC ATCATTTCAG 
TTCTTCCTAT TTATTTTTAT 
ATTTTTGTTT CTTAGAAGTT 
ATAGCTCTGA GAAAAGGTTT 
AGACTACACA TTTAATTATA 
TGGATTGTCC TTCAGACCTT 
GCTGTTCCCT TTCTACCTTC 
CAGCTTGCTG ACATAAGTCA 
CCCCCAGTCT TGTGCCAGCG 
CAGCCCAGGA GAGGGACTCT 
CTGGTTGACT GTTTTTATTT 
TTGATTTGTG GATTAAAAGC 
CGGTGGACAC TTGAGGCTGA 
TGCTTATCTG TGATTGTTGC 
ATTTTTAAAA ATTATACTTT 
TCCAAAGAAG TTCACATGTA 
CTATTATAAC TGCTTCATTT 
GAAGGATCCT TTTGTAGCAG 
TAGGGGAGCC AGTTTGGAGC 
TCGCAGCCCA AGCACTGTGG 
TTCCATAGGC GTACAAAACA 
AATATTTTTG CTTTAGTATG 
TTGCTACAAC ATTTTCGAAA 
AAAAATGCTT GGCAAAAAAA 
GAAAGTATGT ATCAGGAATA 
ATGCCAGTTG TTTACATGTA 
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TTCAAGGATG 
TTGGTATTGC 
AGGATTTTGA 
CTCCACTGAG 
TTGTTAGAAA 
GAAAACACCA 
CAGCCCTTGG 
TGGCATCACT 
GTGCTATTGT 
CCCAGTGGAA 
TCAAATATAG 
TTAAGCTCTC 
GAGCCAGAAC 
GAGAACTGAT 
GATCCAAGCC 
GGAAAACTCC 
TCCAGAACAG 
TGCCTACGGA 
TATCCCAAAA 
TGAATGTCAT 
GCACCCTTTA 
GCTAAAGTGA 
TGAAAATACA 
TGCCCCTTGC 
AGTTCTTCGG 
GGAGTGTTTG 
TGTTCTCTTG 
GTTAGGAAAT 
CTTGCTCTCT 
TTAGTTGCTT 
TCTCATTTTT 
TTTTCATGTT 
TCTAGAAACT 
CATGGTAATT 
AATGTAAAGA 
TAATAAGACA 
TATAAGGAAT 
TTTGAAAAAT 
AATTTGTGTG 
TAGGGTTTTA 
CAGCTTCTCT 
AGTCCTCAGG 
TTACCAGAGC 
GCTGCAAAGG 
CCTAGAGCCG 
GGCAGCGTTC 
CTTAGGCTTT 
AACATTTGAG 
GGATGGGAGT 
TCACCTGAGT 
TACATTTATT 
ATAAGTAGAA 
GCTGGGAACC 
TGTTTATGAA 
AGAGGCCTGA 
AGCATCCACA 
GTATTAAAGC 
AGGAAAGTAA 
ACAAAGTTGG 
ATATAGTGTT 
AAGTGATATT 
CTATATATGT 



TTTTTGGTTA 
AGATGACGCT 
TACTTTATTG 
ATACACAAAG 
GATTATTAGT 
GTTTGATCAT 
TATTTTAATT 
GATCTGCTCA 
GTTTGCTATA 
TATTGTAGGG 
TACTAAACCA 
TGCACTTCGG 
AAAAATAGTA 
AAAGTTAAAA 
TGGTTGCAGT 
CTTATGTAAC 
TGTTTACAAA 
GAACTACATC 
ACTTTTATAG 
TCTAATTATA 
AAATTTGCTA 
GCAAAGCTAC 
GGACAATTCT 
TTCTTTTTTC 
TCATGTCAGC 
CTATATAAAA 
TTAATGAAGC 
TCCCTTAACT 
CTCTTCTCCT 
AT CAAGTACT 
AGCATTATTC 
TAATTATAGT 
AATGTATATT 
TTTCTTTTAC 
ATAATGATAA 
AAGCCTTAAG 
AAGTATATTT 
TTCTACACCT 
AAATGAGATT 
AATTCTAAGC 
TTCTTAACCA 
CATGGTTTCT 
CCAAGGGCAG 
CTGAGGAGTG 
CAGCTCCCAG 
TTCAGATTTG 
TGCTAGTTTT 
CGATGATGCA 
TGACATGAGC 
GTGGCTGATT 
TTATATTTTT 
ATTCTGTATA 
ATTAAAAGTA 
TGTAACCCCC 
AGGTCCCTGC 
CCTTTGATGG 
TCAGTGTTTT 
GGATGGGCAA 
GGCTGTATTT 
AAAATAGGCC 
GCATAGGAGT 
TAAATTAAAA 



TTTGGAACTG 
CATATTGGCA 
TATACCTGTG 
ACATTATTGC 
GATATGTGGG 
GGAGAGCTGG 
ATGAGACTAA 
AGACAGCTAT 
TTAGCAGCAA 
GAGTTCAGCA 
GATGCAGTGT 
CCCATTGTGA 
TACTCAATGT 
GTGAACTATT 
ATGCCTGAAA 
CTCTTGGTGA 
GTCCTAGAAG 
TGTAATGGTT 
GTAACTGTTT 
AAAATGACTT 
TGCAAATGAG 
CTGTATAAAG 
GACAATGTAG 
TGCCTCTTGC 
CCCTGTCATC 
CTATCTGTTT 
TTTTCCTGCC 
TCCAGCCATA 
CTTCCCCATA 
TATTCTTGGT 
AAATGTTTAT 
TTTAAGAAAA 
TGATTAGACA 
TATTAAGATA 
ATGGAGTTTT 
CCTTATGTTA 
CGTCCTCCTC 
TCTTTGAATT 
CTTCAAAACG 
AAAGCGTGAC 
CAGGCAGATT 
GGTGCCCACT 
GCCTGGTCCC 
TGCCCTCAGA 
GGATGCTCCT 
TGGCCACTGT 
AGAAAATAGG 
CAACAGTCCA 
AGGGAGAGGG 
GTGTACATCC 
CTCACCCCCA 
GGAAAAAAGC 
ATATAAATTA 
AGCAAAATAT 
TATGCAGCCG 
CAATGCAGAT 
GCATATTGTT 
AGAAGCGATC 
CTTTAAAAAG 
AGTGATATTA 
ATTGTATTTT 
AAAATCATGA 



T CAT AC T T AA 780 

ACTTACTAAC 840 

CAGCGGAGTT 900 

TTCCAGTTGT 960 

GTGTCTTAGC 102 0 

TTTACCATGC 10 80 

AACTCTTCTT 1140 

TTGGATGGCT 12 00 

TGTCAATACA 12 60 

ATTTGCCCCA 13 20 

TTGCGGGTGC 13 80 

ATCATCCACA 1440 

ATAGTCGGAA 1500 

ACATTCTAGA 1560 

TTTGGGATGT 162 0 

AGGATTCCAA 1680 

TTGTAAAAGA 1740 

TTAATGTTTT 180 0 

T CAAAT AG AA 1860 

ACACCTTTAT 192 0 

TATATGCTTG 1980 

AAAACACAGT 2040 

GGGCTGATTT 210 0 

TCTTGTCTTT 2160 

AACTTGAGTT 222 0 

GTTTTACTTC 22 80 

CATTATTAAT 2340 

TGGCATTATC 2400 

TTTTCTGTCA 24 6 0 

TTTAAAAAAA 252 0 

ATTTTAATAC 25 8 0 

ACT ATTT TGA 2 640 

TCATTTATAG 270 0 

CAAT AAAACA 2 760 

TTATATTTTA 2 820 

TAATTTTGGT 2 880 

TTTAGTTTTT 2 940 

CCTTGTATGA 3 00 0 

ATGAAACCTC 3 0 60 

TATGGCTGAC 312 0 

AACCTCATTG 3180 

CCTGGAAGCC 3240 

GGGGAAGCAG 33 00 

GAAGCACCGC 33 60 

TCCCTGGAGG 3 42 0 

TTCTCATTTG 3 480 

GAAGCAG CCC 3 540 

GGAAAATGGG 3 600 

AGGTGCGCGC 3 6 60 

AGCAGTTACA 3 72 0 

GTAATTTCCT 3 780 

ATTAAAAATA 3 840 

GCTTTTTCCA 3 900 

GGCTATATAT 3 960 

TGGCCACAGC 4020 

TGGTAGCAGG 40 80 

AGCATTTACA 4140 

AAAATAGCTA 420 0 

ATAAGCCTCT 42 60 

ATGAGAAAAT 432 0 

TATGAATTTT 43 80 
GAAATG 
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Seq ID NO: 4 99 Protein sequence 
Protein Accession #: BAA74900.1 



70 



75 



80 



PLVINTLKRF 
ACFYVAVIFI 
SYPFLVLQML 
GYIDICKIjRK 
ELSIiWVIQGC 
DFMEKETPLR 
LQLIiAYTALG 
GSANLQTQWN 
YEDAGLRART 
ED P ANAGKTP 



11 
I 

NLYPE VILAS 
LNGLMMALFF 
IiVTHILRATK 
IIYIHMISLA 
PWLFGTVILK 
YTKTLLLPW 
ILIMRIiKLFL 
IVGEFSNLPQ 
KIVYSMYSRK 
LCNLLVKDSK 



21 
f 

WYRIYTKIMD 
IYGTYLSGSR 
LYRGSLIALC 
LCFVLMFGNS 
YLTSKIFGIA 
LWFVAIVRK 
TPHMCVMASL 
EELIEWIKYS 
AAEEVKREL I 
PHFTTVFQNS 



31 
I 

LIGIQTKICW 
LGGLVTVLCF 
ISNVFFMLPW 
MLLTSYYASS 
DDAHIGNLLT 
IISDMWGVLA 
ICSRQLFGWL 
TKPDAVFAGA 
KLKVNY Y I LE 
VYKVLEWKE 



41 
I 

TVTRGEGLSP 
FFNHGECTRV 
QFAQFVLLTQ 
LVIIWGILAM 
SKFFSYKDFD 
KQQTHVRKHQ 
FCKVHPGAIV 
MPTMASVKLS 
ESWCVRRSKP 



51 
I 

IESCEGLGDP 60 

MWTPPLRESF 12 0 

IASLFAVYW 180 

KPHFLKINVS 240 

TLIiYTCAAEF 3 00 

FDHGELVYHA 3 60 

FAILAAMSIQ 42 0 

AIiRPIVNHPH 480 

GCSMPEIWDV 540 



Seq ID NO: 500 DNA sequence

Nucleic Acid Accession #: NM_001276.1 

Coding sequence: 127..1278



„ 1 11 21 31 41 51 

85 ] | | | | | 

AGTGGAGTGG GACAGGTATA TAAAGGAAGT ACAGGGCCTG GGGAAGAGGC CCTGTCTAGG 
TAGCTGGCAC CAGGAGCCGT GGGCAAGGGA AGAGGCCACA CCCTGCCCTG CTCTGCTGCA 
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GCCAGAATGG GTGTGAAGGC 
TGCTCTGCAT ACAAACTGGT 
GGGAGCTGCT TCCCAGATGC 
GCCAATATAA GCAACGATCA 
ATGCTCAACA CACTCAAGAA 
TGGAACTTTG GGTCTCAAAG 
TTCATCAAGT CAGTACCGCC 
TGGCTCTACC CTGGACGGAG 
GCCGAATTTA TAAAGGAAGC 
TCTGCGGGGA AGGTCACCAT 
GATTTCATTA GCATCATGAC 
CACAGTCCCC TGTTCCGAGG 
TATGCTGTGG GGTACATGTT 
CCCACCTTCG GGAGGAGCTT 
TCAGGACCGG GAATTCCAGG 
ATCTGTGACT TCCTCCGCGG 
GCCACCAAGG GCAACCAGTG 
CAGTACCTGA AGGATAGGCA 
TTCCAGGGCT CCTTCTGCGG 
GCACTCGCTG CAACGTAGCC 
CCCCCTCTGG CTCCAGCTGG 
GCCTCAGTCT CCCTCCCTTG 
GCCCTGGTGG GCAGAGAGGT 
GACTCGGGAT TAGTACACAC 
TGGCAAGGGA ATTTCTTCAA 
TGGCAAGCTC TATCACCAAG 
TACCCCCTGC AAAGCCAGCT 
ACTTCCCCTT CCTAATTCCA 
CGCTTTGCTT TGGTCTATCT 
TCTTCTGGGT TCCTTCCTCT 
ATGTT 
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GTCTCAAACA 
CTGCTACTAC 
CCTTGACCGC 
CATCGACACC 
CAGGAACCCC 
ATTTTCCAAG 
ATTCCTGCGC 
AGACAAACAG 
CCAGCCAGGG 
TGACAGCAGC 
CTACGATTTT 
TCAGGAGGAT 
GAGGCTGGGG 
CACTCTGGCT 
CCGGTTCACC 
AGCCACAGTC 
GGTAGGATAC 
GCTGGCAGGC 
CCAGGATCTG 
CTCTGTTCTG 
CCGGGAGCCT 
GGGCCTATGC 
AGGGATGGGG 
TTGTTGATGA 
CTCCCTGCCC 
GAGCCAAACA 
TGAAACCTTC 
CAGCTGCTCA 
TTGAGCGCCC 
GAGCCTTGGG 



GGCTTTGTGG 
ACCAGCTGGT 
TTCCTCTGTA 
TGGGAGTGGA 
AACCTGAAGA 
ATAGCCTCCA 
ACCCATGGCT 
CATTTTACCA 
AAAAAGCAGC 
TATGACATTG 
CATGGAGCCT 
GCAAGTCCTG 
GCTCCTGCCA 
TCTTCTGAGA 
AAGGAGGCAG 
CATAGAACCC 
GACGACCAGG 
GCCATGGTAT 
CGCTTCCCTC 
CACACAGCAC 
GATCACCTGC 
AGAGGTCCAC 
CTGTGGGGAT 
TTAATGGAAA 
CCTAGCCCTC 
TCCTACAAGA 
ACTTAGGAAC 
ATAAAGTACA 
ACTAGACCCA 
ACCCCTGAGC 



TCCTGGTGCT 
CCCAGTACCG 
CCCACATCAT 
ATGATGTGAC 
CTCTCTTGTC 
ACACCCAGAG 
TTGATGGGCT 
CCCTAATCAA 
TCCTGCTCAG 
CCAAGATATC 
GGCGTGGGAC 
ACAGATTCAG 
GTAAGCTGGT 
CTGGTGTTGG 
GGACCCTTGC 
TCGGCCAGCA 
AAAGCGTCAA 
GGGCCCTGGA 
TCACCAATGC 
GGGGGCCAAG 
CCTGCTGAGT 
AACACACAGA 
AGTGAGGCAT 
TGTTTACAGA 
CTTAT CAAAG 
CACAGTGACC 
GTAATCGTGT 
AGAGTTTAAC 
CTGGACTCAC 
TTGCAGAGAT 



GCTCCAGTGC 180 

GGAAGGCGAT 240 

CTACAGCTTT 3 0 0 

GCTCTACGGC 3 60 

TGTCGGAGGA 420 

TCG CCGG ACT 480 

GGACCTTGCC 540 

GGAAATGAAG 600 

CGCAGCACTG 660 

CCAACACCTG 720 

CACAGGCCAT 780 

CAACACTGAC 84 0 

GATGGGCATC 900 

AGCCCCAATC 960 

CTACTATGAG 102 0 

GGTCCCCTAT 1080 

AAG CAAGGTG 114,0 

CCTGGATGAC 1200 

CATCAAGGAT 12 60 

GATGCCCCGT 132 0 

CCCAGGCTGA 13 80 

TTTGAGCTCA 1440 

CGCAATGTAA 1500 

TCCCCAAGCC 15 60 

GACACCATTT 162 0 

ATACTAATTA 168 0 

CCCCTATCCT 1740 

AGTGTGTTGG 1800 

CTCCCCCATC 1860 

GAAGGCCGCC 1920 



35 



Seq ID NO: 501 Protein sequence 
Protein Accession #: NP_001267.1



40 



45 



50 



55 



60 



65 



MGVKASQTGF 
ISNDHIDTWE 
KSVPPFLRTH 
GKVTIDSSYD 
VGYMLRLGAP 
DFLRGATVHR 
GSFCGQDLRF 



11 
I 

WLVLLQCCS 
WNDVTLYGML 
GFDGLDLAWL 
IAKISQHLDF 
ASKLVMGIPT 
TLGQQVPYAT 
PLTNAIKDAL 



21 



AYKLVCYYTS 
NTLKNRNPNL 
YPGRRDKQHF 
ISIMTYDFHG 
FGRSFTLASS 
KGNQWVGYDD 
AAT 



31 
I 

WSQYREGDGS 
KTLLSVGGWN 
TTLIKEMKAE 
AWRGTTGHHS 
ETGVGAPISG 
QESVKSKVQY 



41 
I 

CFPDALDRFL 
FGSQRFSKIA 
FIKEAQPGKK 
PLFRGQEDAS 
PGIPGRFTKE 
LKDRQLAGAM 



51 
I 

CTHIIYSFAN 
SNTQSRRTFI 
QLLLSAALSA 
PDRFSNTDYA 
AGTLAYYEIC 
VWALDLDDFQ 



Seq ID NO: 502 DNA sequence 

Nucleic Acid Accession #: NM_006474.1

Coding sequence: 181..669



GCTGCCTAGG 
TCCGGCCCCC 
TTCCCCCAGC 
ATGTGGAAGG 
GAAGGAGCCA 
GTTGCCATGC 
AAGTCTGGCT 
GAGGATCTGC 
GCCTCAAACG 
GTTGAGAAAG 
GCCATCGGTT 
TCGCCCTAAA 
TTCTGACTCT 
CGGGCCCATT 
TCACCAGATT 



11 

i 

GTCTGGAAAG 
CCACCGTCGC 
TCAGAATCTT 
TGTCAGCTCT 
GCACAGGCCA 
CAGGTGCCGA 
TGACAACTCT 
CAACTTCAGA 
TGGCCACCAG 
ATGGTTTGTC 
TCATTGGTGG 
GAGCTGAAGG 
GTGGCCCTGT 
CAGATTCCAC 
TGGTTCTTAA 



21 
I 

CTCGGGCACC 
GCTCCTCCAG 
GCTGCTCGGC 
GCTCTTCGTT 
GCCAGAAGAT 
AGATGATGTG 
GGTGGCAACA 
AAGCACAGTC 
TCACTCCACG 
AACAGTGACC 
AATCAT CGTT 
GTTACGCCCT 
CCCTGAGCTC 
GGTGACTTTC 
ACTTT 



31 

i 

CTCCCTCTCC 
GCTGGGCCTG 
CCCCAGGAGA 
TTGGGAAGCG 
GACACTGAGA 
GTGACTCCAG 
AGTGTCAACA 
CACGCGCAAG 
GAGAAAGTGG 
CTGGTTGGAA 
GTGGTTATGC 
GCTTGCCAAC 
GTGGGGAGAA 
CGTTTGCCAA 



41 

I 

GGGGCTCCTG 
TGGCCGCGGT 
GCAACAACTC 
CGTCGCTCTG 
CTACAGGTTT 
GAACCAGCGA 
GTGTAACAGG 
AACAAAGTCC 
ATGGAGACAC 
TCATAGTTGG 
GAAAAATGTC 
GTGCTTTAAA 
GATGACCCTG 
ATTAACCGAG 



51 
I 

CTCCCACCCC 
GCTTTTAATT 
AACGGGAACG 
GGTCCTGGCA 
GGAAGGCGGC 
AGACCGCTAT 
CATTCGCATC 
AAGCGCCACA 
ACAGACAACA 
GGT CTT ACTA 
GGGAAGGTAC 
AAAAGACCGT 
GGAACATTTG 
GAAAGACCTT 



60 
120 
180 
240 
300 
360 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 



70 



75 



Seq ID NO: 503 Protein sequence 
Protein Accession #: NP_006465.1



11 



21 



31 



51 



41 

I I I I I I 

MWKVSALLFV LGSASLWVLA EGASTGQPED DTETTGLEGG VAMPGAEDDV VTPGTSEDRY 

KSGLTTLVAT SVNSVTGIRI EDLPTSESTV HAQEQSPSAT ASNVATSHST EKVDGDTQTT 

VEKDGLSTVT LVGIIVGVLD AIGFIGGIIV WMRKMSGRY SP 



60 
120 



80 



85 



Seq ID NO: 504 DNA sequence 
Nucleic Acid Accession #: Eos sequence
Coding sequence: 62..895



1 
I 

CACTGCTCTG 
TATGATCATC 
CAAGGATGGA 
AGAAGCACGG 
TGAAGGCGGC 



11 

I 

AGAATTTGTG 
TTAATTTACT 
ATTTTTCATA 
TCTGGCAAAT 
CATCTCGCAA 



21 
I 

AGCAGCCCCT 
TATTTCTCTT 
ACTCCATATG 
ACAAGCTCAC 
CTTACAAGCA 



31 



AACAGGCTGT 
GCTATGGGAA 
GCTTGAACGA 
CTACGCAGAA 
GCTAGAGGCA 



41 
I 

TACTTCACTA 
GACACTCAAG 
GCAGCCGGTG 
GCTAAGGCGG 
GCCAGAAAAA 



51 



CAACTGACGA 60 

GATGGGGATT 120 

TGTACCACAG 180 

TGTGTGAATT 240 

TTGGATTTCA 300 



377 



WO 02/086443 

TGTCTGTGCT GCTGGATGGA 
GCCCAACTGT GGATTTGGAA 
TGAAAGATGG GATGCCTATT 
AGAT CCAAAG CAAATTTTTA 
CTGCTACTGG CACATTAGAG 
TGACCTTGAA GATGACCCAG 
TGATGT CCAT GGCTTTGTGG 
TACAGGAAAT GTCATGACCT 
CCAAATCAAA TATGTTGCAA 
TACTACTTCT ACTGGAAATA 
AAAAAAAGGA TGATCAAAAC 
CTCACTGTTA TTATTAACAT 
TAGGGAAAAT TGGAAAATAT 
ACTGCATAGA AATAACAAGC 
TTTGTGGTAT ATGTATATAT 
TCTATGTACA GTTTTGTATT 
TCATTGATTA TTCTACAAAA 
TGTTTTATGC ATTATTTAAG 
ATTGTTGCAA TAAATATCCT 



TGGCTAAGGG CAGAGTTGGA 
AAACTGGCAT TATTGATTAT 
GCTACAACCC ACACGCAAAG 
AATCTCCAGG CTTCCCAAAT 
TCAAGTATGG TCAGCGTATT 
GTTGCTTGGC TGATTATGTT 
GAAGATACTG TGGAGATGAG 
TGAAGTTTCT AAGTGATGCT 
TGGATCCTGT ATCCAAATCC 
AAAACTTTTT AGCTGGAAGA 
ACACAGTGTT TATGTTGGAA 
TTATTTATTA TTTTTCTAAA 
AGGAAACTTT AAACGAGAAA 
GTTAACATTT TCATATTTTT 
GTACCTATAT GTATTTGCAT 
ATACTTTTTA AATCTTGAAC 
ACATGATTTT AAACAGCTGT 
CCTGTCTCTA TTGTTGGAAT 
TGAACACACA AAAAAAAAAA 



TACCCCATTG TGAAGCCAGG 
GGAATCCGTC TCAATAGGAG 
GAGTGTGGTG GCGTCTTTAC 
GAGTACGAAG ATAACCAAAT 
CACCTGAGTT TTTTAGATTT 
GAAATATATG ACAGTTACGA 
CTTCCAGATG ACAT CATCAG 
TCAGTGACAG CTGGAGGTTT 
AGTCAAGGAA AAAATACAAG 
TTTAGCCACT TATAAAAAAA 
TCTTTTGGAA CTCCTTTGAT 
TGTGAAAGCA ATACATAATT 
ATGAAACCTC TCATAATCCC 
TTCTTTCAGT CATTTTTCTA 
TTGAAATTTT GGAATCCTGC 
TTTATAAACA TTTTCTGAAA 
AAAATATTCT ATGATATGAA 
TTCAGGTCAT TTTCATAAAT 
AA 



Seq ID NO: 505 Protein sequence 
Protein Accession #: Eos sequence



1 11 21 31 41 51 

I I I I I I 

MIILIYLFLL LWEDTQGWGF KDGIFHNSIW LERAAGVYHR EARSGKYKLT YAEAKAVCEF 

EGGHLATYKQ LEAARKIGFH VCAAGWMAKG RVGYPIVKPG PNCGFGKTGI IDYGIRLNRS 

ERWDAYCYNP HAKECGGVFT DPKQIFKSPG FPNEYEDNQI CYWHIRLKYG QRIHLSFLDF 

DLEDDPGCLA DYVEIYDSYD DVHGFVGRYC GDELPDDIIS TGNVMTLKFL SDASVTAGGF 

QIKYVAMDPV SKSSQGKNTS TTSTGNKNFL AGRFSHL 



Seq ID NO: 506 DNA sequence

Nucleic Acid Accession #: NM_007115.1

Coding sequence: 69..902



1 11 21 

I I I 

GAATTCGCAC TGCTCTGAGA ATTTGTGAGC 

CTGACGATAT GATCATCTTA ATTTACTTAT 

GGGGATTCAA GGATGGAATT TTTCATAACT 

ACCACAGAGA AGCACGGTCT GGCAAATACA 

GTGAATTTGA AGGCGGCCAT CTCGCAACTT 

GATTTCATGT CTGTGCTGCT GGATGGATGG 

AGCCAGGGCC CAACTGATGA TTTGGAAAAA 

ATAGGAGTGA AAGATGGGAT GCCTATTGCT 

TCTTTACAGA TCCAAAGCGA ATTTTTAAAT 

ACCAAATCTG CTACTGGCAC ATTAGACTCA 

TAGATTTTGA CCTTGAAGAT GACCCAGGTT 

GTTACGATGA TGTCCATGGC TTTGTGGGAA 

TCATCAGTAC AGGAAATGTC ATGACCTTGA 

GAGGTTTCCA AATCAAATAT GTTGCAATGG 

ATACAAGTAC TACTTCTACT GGAAATAAAA 

AAAAAAAAAA AAGGATGATC AAAACACACA 

TTGAT CTCAC TGTTATTATT AACATTTATT 

TAATTTAGGG AAAATTGGAA AATATAGGAA 

ATCCCACTGC ATAGAAATAA CAAGCGTTAA 

TTGTATTTGT GGTATATGTA TATATGTACC 

u , CCTGCTCTAT GTACAGTTTT GTATTATACT 

TGAAATCATT GATTATT CTA CAAAAACATG 

ATGAATGTTT TATGCATTAT TTAAGCCTGT 

TAAATATTGT TGCAATAAAT ATCCTTCGGA 



31 41 51 

I. 1 I 

AGCCCCTAAC AGGCTGTTAC TTCACTACAA 

TTCTCTTGCT ATGGGAAGAC ACTCAAGGAT 

CCATATGGCT TGAACGAGCA GCCGGTGTGT 

AGCTCACCTA CGCAGAAGCT AAGGCGGTGT 

ACAAGCAGCT AGAGGCAGCC AGAAAAATTG 

CTAAGGGCAG AGTTGGATAC CCCATTGTGA 

CTGGCATTAT TGATTATGGA ATCCGTCTCA 

ACAACCCACA CGCAAAGGAG TGTGGTGGCG 

CTCCAGGCTT CCCAAATGAG TACGAAGATA 

AGTATGGTCA GCGTATTCAC CTGAGTTTTT 

GCTTGGCTGA TTATGTTGAA ATATATGACA 

GATACTGTGG AGATGAGCTT CCAGATGACA 

AGTTTCTAAG TGATGCTTCA GTGACAGCTG 

ATCCTGTATC CAAATCCAGT CAAGGAAAAA 

ACTTTTTAGC TGGAAGATTT AGCCACTTAT 

GTGTTTATGT TGGAATCTTT TGGAACTCCT 

TATTATTTTT CTAAATGTGA AAGAAATACA 

ACTTTAAACG AGAAAATGAA ACCTCTCATA 

CATTTTCATA TTTTTTTCTT TCAGTCATTT 

TATATGTATT TGCATTTGAA ATTTTGGAAT 

TTTTAAATCT TGAACTTTAT GAACATTTTC 

ATTTTAAACA GCTGTAAAAT ATTCTATGAT 

CTCTATTGTT GGAATTTCAG GTCATTTTCA 

ATTC 



Seq ID NO: 507 Protein sequence 
Protein Accession #: NP_009046.1



1 11 21 

I I I 

MIILIYLFLL LWEDTQGWGF KDGIFHNSIW 

EGGHLATYKQ LEAARKIGFH VCAAGWMAKG 

ERWDAYCYNP HAKECGGVFT DPKRIFKSPG 

DLEDDPGCLA DYVEIYDSYD DVHGFVGRYC 

QIKYVAMDPV SKSSQGKNTS TTSTGNKNFL 



31 41 51 

I I I 

LERAAGVYHR EARSGKYKLT YAEAKAVCEF 

RVGYPIVKPG PNXXFGKTGI IDYGIRLNRS 

FPNEYEDNQI CYWHIRLKYG QRIHLSFLDF 

GDELPDDIIS TGNVMTLKFL SDASVTAGGF 

AGRFSHL 



Seq ID NO: 508 DNA sequence 

Nucleic Acid Accession #: NM_001044.1 

Coding sequence: 129..1991

1 11 21 31 41 51 

I I I I I I 

ACCGCTCCGG AGCGGGAGGG GAGGCTTCGC GGAACGCTCT CGGCGCCAGG ACTCGCGTGC 

AAAGCCCAGG CCCGGGCGGC CAGACCAAGA GGGAAGAAGC ACAGAATTCC TCAACTCCCA 

GTGTGCCCAT GAGTAAGAGC AAATGCTCCG TGGGACTCAT GTCTTCCGTG GTGGCCCCGG 

CTAAGGAGCC CAATGCCGTG GGCCCGAAGG AGGTGGAGCT CATCCTTGTC AAGGAGCAGA 

ACGGAGTGCA GCTCACCAGC TCCACCCTCA CCAACCCGCG GCAGAGCCCC GTGGAGGCCC 

AGGATCGGGA GACCTGGGGC AAGAAGATCG ACTTTCTCCT GTCCGTCATT GGCTTTGCTG 

TGGACCTGGC CAACGTCTGG CGGTTCCCCT ACCTGTGCTA CAAAAATGGT GGCGGTGCCT 



378 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



WO 02/086443 

TCCTGGTCCC CTACCTGCTC 
TGGCCCTCGG CCAGTTCAAC 
TGAAAGGTGT GGGCTTCACG 
TCATCATCGC CTGGGCGCTG 
TCCACTGCAA CAACTCCTGG 
GTGGAGACAG CTCGGGCCTC 
AACGTGGCGT GCTGCACCTC 
GGCAGCT CAC AGCCTGCCTG 
GCGTGAAGAC CTCAGGGAAG 
CTGCCCTGCT CCTGCGTGGG 
TGAGCGTTGA CTTCTACCGG 
TGTGCTTCTC CCTGGGCGTG 
TCACCAACAA CTGCTACAGG 
TCTCCTCCGG CTTCGTCGTC 
CCATCGGGGA CGTGGCCAAG 
TCGCCACGCT CCCTCTGTCC 
TGGGT AT CG A CAGCGCCATG 
TCCAGCTGCT GCACAGACAC 
TCCTGTCCCT GTTCTGCGTC 
TTGCAGCCGG CACGTCCATC 
TCTATGGTGT TGGGCAGTTC 
TGTACTGGCG GCTGTGCTGG 
TCAGCATTGT GACCTTCAGA 
ACGCGCTGGG CTGGGTCATC 
ACAAGTTCTG CAGCCTGCCT 
AGAAGGACCG TGAGCTGGTG 
TCAAGGTGTA GAGGGAGCAG 
ACGAACAAAC CAAGGAAATC 
CTCTACTGAA AACACAAACA 
TCCGTGCCGG GAGCGCACCT 
GCAGCGAGGT CCACCCCGTT 
TCTGTGTGAG GCTCCCTCCC 
CACTGTGTTC TCAGGCGGGG 
CTCACAGTAG CTTCCTAGAC 
GGTTTAGCTG TGCAGAAGGT 
GATGCGTGGC TCCCAGCAGA 
GTCTGTTCAG AGGCAT TGGA 
ATGTTCTTGC AGCAGAGAGA 
GGCAGCCTGT GGGTCCTTGT 
GACGCATGCA GGGCCCCCAC 
AGGAGCATGT CCTATCCCTG 
AACGCATGCA GGGCCCCCAC 
TGGAGCGTGT ACTACCCCAG 
GACCGGACGC ATGCAGGGCC 
CCCACAGGAG CGTGTACTAC 
CCCAGGACGC ATGCAGGGCC 
TGAGCCGTGA CCTCCAGGAA 
CATCAATAAC AACAGTTTTT 
ATCAAAACAA ATTCAAGAAT 
TTTACAAGAA TAATTAGCAA 
CACACTGCCC TCTGCCACTG 
TCGGTGGGCC TGCCTACGTG 
TCCCCTGCAA GTGGACGTGG 
GCCTGTGAAC TGCCAGGCAG 
GGGAGGGACA CAGAGGACGG 
GCGGCTTCCC CATTGCCTTC 
GTTGTTGAAG ACAGCACAGA 
AGCAACCCAG GTGTTGTCCG 
TAAGCACAAT AAAAGACATC 



PCT/US02/12476 



TTCATGGTCA 
AGGGAAGGGG 
GTCATCCTCA 
CACTATCTCT 
AACAGCCCCA 
AACGACACTT 
CACCAGAGCC 
GTGCTGGTCA 
GTGGTATGGA 
GTCACCCTCC 
CTCTGCGAGG 
GGGTTCGGGG 
GACGCGATTG 
TTCTCCTTCC 
GACGGGCCAG 
TCAGCCTGGG 
GGTGGTATGG 
CGTGAGCTCT 
ACCAACGGTG 
CTCTTTGGAG 
AGCGACGACA 
AAGCTGGTCA 
CCCCCCCACT 
GCCACATCCT 
GGGTCCTTTC 
GACAGAGGGG 
AGACGAAGAC 
TAAGTTTCGA 
ACAAAGCAGA 
CGCCGTGTCT 
GTTGTCCCTG 
TCCCTGCTCC 
AT CACGAT CC 
CATTTACTTT 
GAAATGGAGG 
GGCCGTAAAT 
GGATGGGGGT 
AATAAAACTC 
GGTGTAGGGA 
AGGAGCGTGT 
GACGCATGCA 
AGGAGCGTGT 
GACGCATGCA 
CCCACAGGAG 
CCCAGGATGC 
CCCATGCAGG 
GGGACCCCAC 
ATGTTTGCGA 
GCAGT AT CCG 
TACTGAGTGA 
ACAGGAAAGT 
CTGCCCGAGG 
GCTCCAGGGA 
CTGCAGTTAG 
CTTCCCCATC 
TGGGGAGGGA 
GAGCGGCTTC 
TGTCTGTTGA 
CACAATGGAA 



TTGCTGGGAT 
CCGCTGGTGT 
T CTCACTGT A 
TCTCCTCCTT 
ACTGCTCGGA 
TTGGGACCAC 
ATGGCAT CGA 
TCGTGCTGCT 
TCACAGCCAC 
CTGGAGCCAT 
CGTCTGTTTG 
TGCTGATCGC 
TCACCACCTC 
TGGGGTACAT 
GGCTGATCTT 
CCGTGGT CTT 
AGT CAGTGAT 
TCACGCTCTT 
GCATCTACGT 
TGCTCATCGA 
T CC AGCAGAT 
GCCCCTGCTT 
ACGGAGCCTA 
CCATGGCCAT 
GAGAGAAACT 
AGGTGCGCCA 
CCCAGGAAGT 
GAGAAAGGAG 
AGACTCCTCT 
TGTGTTGCTG 
CAGGGCAGAA 
CTGCTCCCGG 
TTGTAGACGC 
GCCCATATTA 
AAACCACAAA 
TGAGCGTTCA 
CCTGGTATGT 
CTTGAAACCA 
ACGGCCTGAG 
CCTATCCCCG 
GGGCCCCCAC 
ACTACCCCAG 
GGGCCCCCAC 
CGTGTACTAC 
ATGCAGGGCC 
CAGCCTGCAG 
TGGAATTTTA 
ATGGCTTTTT 
CGAGCCTGCT 
AGGATGTTGG 
GGATGCCATA 
GCAGGGGCCG 
CTGGAGTGTA 
CACAGAGGAT 
GCCTTCTGGC 
CACAGAGGAC 
CCCATCGCCT 
CCAATCTCTA 
AAAAAAAAAG 



GCCACTTTTC 
CTGGAAGATC 
TGTCGGCTTC 
CACCACGGAG 
TGCCCATCCT 
ACCTGCTGCC 
CGACCTGGGG 
CTACTTCAGC 
CATGCCATAC 
AGACGGCATC 
GATTGACGCG 
CTTCTCCAGC 
CATCAACTCC 
GGCACAGAAG 
CATCATCTAC 
CTTCATCATG 
CACCGGGCTC 
CATCGTCCTG 
CTTCACGCTC 
AGCCATCGGA 
GACCGGGCAG 
TCTCCTGTTC 
CATCTTCCCC 
GGTGCCCATC 
GGCCTACGCC 
GTTCACGCTC 
CATCCTGCAA 
GGCAACTTCT 
CTTCTGACTG 
TAATAACGAC 
AAACGTCTAA 
CTCTGAGGCT 
ACCTGCTGAG 
AAAAGCCAAG 
TTCATGCAAA 
GTTGACACAT 
CTCACCAGGA 
GCTCAGGCTA 
AGGAGCGTGT 
GACGCATGCA 
AGGAGCGTGT 
GACGCATGCA 
AGGAGCGTGT 
CCCAGGACGC 
CCCACAGGAG 
ACCAACACTC 
TTTCTCTCAG 
AAAATCATAT 
TGCTGATATT 
CCAAAAGCTG 
GTTTGAATTC 
TGCAGGGCCA 
ATGCTCGGTG 
GGCTTCCCCA 
CGCTGCAGTC 
AGTTTCCCCA 
TCTGGGGAGG 
TTCAGCATCG 
GAATTC 



TACATGGAGC 480 

TGCCCCATAC 540 

TTCTACAACG 600 

CTCCCCTGGA 660 

GGTGACTCCA 720 

GAGTACTTTG 780 

CCTCCGCGGT 840 

CTCTGGAAGG 900 

GTGGTCCTCA 960 

AG AG CAT AC C 102 0 

GCCACCCAGG 10 80 

TACAACAAGT 1140 

CTGACGAGCT 1200 

CACAGTGTGC 1260 

CCGGAAGCCA 1320 

CTGCTCACCC 13 80 

ATCGATGAGT 1440 

GCGACCTTCC 1500 

CTGGACCATT 1560 

GTGGCCTGGT 162 0 

CGGCCCAGCC 1680 

GTGGTCGTGG 1740 

GACTGGGCCA 1800 

TATGCGGCCT 1860 

ATTGCACCCG 1920 

CGCCACTGGC 1980 

TGGGAGAGAC 2 040 

ACTCTTCAAC 2100 

TTTACACCTT 2160 

GTAGATCTGT 2220 

CTTCATGCTG 2280 

GCCCCAGGGG 2 340 

AATCCCCGTG 2400 

TGTCCTGCTT 2460 

GTCCTTTCCC 2 52 0 

TGCACACACA 2 580 

AATTCTGTTT 2640 

CTGCCACTCA 270 0 

CCTATCCCCG 2 760 

GGGCCCCCAC 2 82 0 

ACTACCCCAG 2880 

GGGCCCCCAC 2 940 

CCTATCCCCG 300 0 

ATGCAGGGCC 30 60 

CGTGTACTAC 3120 

TGCCTGGCCT 3180 

GTGCGTGCCA 3240 

TTACCTGTGA 3 3 00 

GCAGTTTTTG 33 60 

CTTTCCATGG 342 0 

ATGCCTCAAG 3 480 

GTCATGGCTG 3540 

GGAGCCGTCA 3 60 0 

TTGCCTTCTG 3 660 

AGCACAGAGA 3720 

TCGCCTTCTG 3 780 

GGCTCCGTGT 3 840 

TGTGGGTCCC 3 900 



Seq ID NO: 509 Protein sequence 
Protein Accession #: NP_001035.1



65 



70 



75 



MSKSKCSVGL 
ETWGKKIDFL 
GQFNREGAAG 
NNSWNSPNCS 
TACLVLVIVL 
DFYRLCEASV 
GFWFSFLGY 
DSAMGGMESV 
GTSILFGVLI 
VTFRPPHYGA 
RELVDRGEVR 



11 
I 

MSSWAPAKE 
LSVIGFAVDL 
VWKICPILKG 
DAHPGDSSGD 
LYFSLWKGVK 
WIDAATQVCF 
MAQKHSVPIG 
ITGLIDEFQL 
EAIGVAWFYG 
Y I FPDWANAIj 
QFTLRHWL.KV 



21 



31 



PNAVGPKEVE 
ANVWRFPYLC 
VGFTVILISL 
SSGLNDTFGT 
TSGKWWITA 
SLGVGFGVLI 
DVAKDGPGIiI 
LHRHRELFTL 
VGQFSDDIQQ 
GWVIATSSMA 



LILVKEQNGV 
YKNGGGAFLV 
YVGFFYNVII 
TPAAEYFERG 
TMPYWLTAL 
AFSSYNKFTN 
FIIYPEAIAT 
FIVLATFLLS 
MTGQRPSLYW 
MVP I YAAYKF 



41 
I 

QLTSSTLTNP 
PYLLFMVIAG 
AWALHYLFSS 
VLHLHQSHGI 
LLRGVTLPGA 
NCYRDAIVTT 
LPLSSAWAW 
LFCVTNGGIY 
RLCWKLVSPC 
CSLPGSFREK 



51 

I 

RQSPVEAQDR 60 

MPLFYMELAL 120 

FTTELPWIHC 180 

DDLGPPRWQL 240 

IDGIRAYLSV 3 00 

SINSLTSFSS 3 60 

FFIMLLTLGI 42 0 

VFTLLDHFAA 480 

FLLFWWSI 540 

LAYAIAPEKD 600 



80 



85 



Seq ID NO: 510 DNA sequence 

Nucleic Acid Accession #: NM_001216.1 

Coding sequence: 43..1422



11 



21 31 41 51 

I 1 i 1 I I 

GCCCGTACAC ACCGTGTGCT GGGACACCCC ACAGTCAGCC GCATGGCTCC CCTGTGCCCC 60 

AGCCCCTGGC TCCCTCTGTT GATCCCGGCC CCTGCTCCAG GCCTCACTGT GCAACTGCTG 120 

CTGTCACTGC TGCTTCTGAT GCCTGTCCAT CCCCAGAGGT TGCCCCGGAT GCAGGAGGAT 180 

TCCCCCTTGG GAGGAGGCTC TTCTGGGGAA GATGACCCAC TGGGCGAGGA GGATCTGCCC 240 



379 



WO 02/086443 

AGTGAAGAGG ATTCACCCAG 
GAGGATCTAC CTGGAGAGGA 
TCCCTGAAGT TAGAGGATCT 
AATAATGCCC ACAGGGACAA 
"5 CCGCCCTGGC CCCGGGTGTC 

CGCCCCCAGC TCGCCGCCTT 
CTCCCGCCGC TCCCAGAACT 
CCTCCTGGGC TAGAGATGGC 
CTGCACTGGG GGGCTGCAGG 

10 CCTGCCGAGA TCCACGTGGT 

GGGCGCCCGG GAGGCCTGGC 
AGTGCCTATG AGCAGTTGCT 
CAGGTCCCAG GACTGGACAT 
TATGAGGGGT CTCTGACTAC 

15 CAGACAGTGA TGCTGAGTGC 

GGTGACTCTC GGCTACAGCT 
GAGGCCTCCT TCCCTGCTGG 
AATTCCTGCC TGGCTGCTGG 
ACCAGCGTCG CGTTCCTTGT 

20 GTGAGCTACC GCCCAGCAGA 

TGTGAGAAGC CAGCCAGAGG 
ATGCCACTTC CTTTTAACTG 



PCT/US02/12476 



AGAGGAGGAT 
GGATCTACCT 
ACCTACTGTT 
AGAAGGGGAT 
CCCAGCCTGC 
CTGCCCGGCC 
GCGCCTGCGC 
TCTGGGTCCC 
TCGTCCGGGC 
TCACCTCAGC 
CGTGTTGGCC 
GTCTCGCTTG 
ATCTGCACTC 
ACCGCCCTGT 
TAAGCAGCTC 
GAACTTCCGA 
AGTGGACAGC 
TGACATCCTA 
GCAGATGAGA 
GGTAGCCGAG 
CATCTGAGGG 
CCAAGAAATT 



CCACCCGGAG 
GAAGTTAAGC 
GAGGCTCCTG 
GACCAGAGTC 
GCGGGCCGCT 
CTGCGCCCCC 
AACAATGGCC 
GGGCGGGAGT 
TCGGAGCACA 
ACCGCCTTTG 
GCCTTTCTGG 
GAAGAAATCG 
CTGCCCTCTG 
GCCCAGGGTG 
CACACCCTCT 
GCGACGCAGC 
AGTCCTCGGG 
GCCCTGGTTT 
AGGCAGCACA 
ACTGGAGCCT 
GGAGCCGGTA 
TTTTAAAATA 



AGGAGGATCT 
CTAAATCAGA 
GAGATCCTCA 
ATTGGCGCTA 
TCCAGTCCCC 
TGGAACTCCT 
ACAGTGTGCA 
ACCGGGCTCT 
CTGTGGAAGG 
CCAGAGTTGA 
AGGAGGGCCC 
CTGAGGAAGG 
ACTTCAGCCG 
TCATCTGGAC 
CTGACACCCT 
CTTTGAATGG 
CTGCTGAGCC 
TTGGCCTCCT 
GAAGGGGAAC 
AGAGGCTGGA 
ACTGTCCTGT 
AAT AT T TATA 



ACCTGGAGAG 3 00 

AGAAGAGGGC 3 60 

AGAACCCCAG 42 0 

TGGAGGCGAC 480 

GGTGGAT AT C 540 

GGGCTTCCAG 60 0 

ACTGACCCTG 660 

GCAGCTGCAT 72 0 

CCACCGTTTC 780 

CGAGGCCTTG 840 

GGAAGAAAAC 900 

CTCAGAGACT 960 

CTACTTCCAA 102 0 

TGTGTTTAAC 10 80 

GTGGGGACCT 1140 

GCGAGTGATT 12 0 0 

AGTCCAGCTG 12 60 

TTTTGCTGTC 13 2 0 

CAAAGGGGGT 13 8 0 

TCTTGGAGAA 1440 

CCTGCTCATT 1500 
AT 



25 



30 



35 



Seq ID NO: 511 Protein sequence 
Protein Accession #: NP_001207.1 



I" 

MAPLCPSPWL 
GEEDLPSEED 
DPQEPQNNAH 
ELLGFQLPPL 
VEGHRFPAEI 
EEGSETQVPG 
DTLWGPGDSR 
GLLFAVTSVA 



11 

I 

PLLIPAPAPG 
SPREEDPPGE 
RDKEGDDQSH 
PELRLRNNGH 
HWHLSTAFA 
LD IS ALL PSD 
LQLNFRATQP 
FLVQMRRQHR 



21 
I 

LTVQLLLSLL 
EDLPGEEDLP 
WRYGGDPPWP 
SVQLTLPPGL 
RVDEALGRPG 
FSRYFQYEGS 
LNGRVIEASF 
RGTKGGVSYR 



31 
I 

LLMPVHPQRL 
GEEDLPEVKP 
RVSPACAGRF 
EMALGPGREY 
GLAVLAAFLE 
LTTPPCAQGV 
PAGVDSSPRA 
PAEVAETGA 



41 



PRMQEDSPLG 
KSEEEGSLKL 
QSPVDIRPQL 
RALQLHLHWG 
EGPEENSAYE 
IWTVFNQTVM 
AEPVQLNSCL 



51 

GGSSGEDDPL 60 

EDLPTVEAPG 12 0 

AAFCPALRPL 180 

AAGRPGSEHT 240 

QLLSRLEEIA 300 

LSAKQLHTLS 360 

AAGDILALVF 420 



40 



Seq ID NO: 512 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..3978 



45 



50 



55 



60 



65 



70 



75 



80 



85 



ATGGTGGGTG 

TTTGCAGAAA 

TTAGCACCCA 

ACGCCGGTGA 

TCGACATATG 

GTAGCAAGGG 

ACACGCGTGT 

CCGACAGTTC 

GTTGGCATTG 

GCCCTTGCCT 

TTGGTTTTTG 

CTCAATATAC 

CCAGCCACCA 

CCCACAGCTC 

GCCAAGCTCA 

ACAATGAATG 

TTTACCAACA 

TTTGTCCAAA 

ACATTATCCT 

ATTGCCATGT 

ATGGCTGAAG 

CCATCTTACA 

TTGACATGGG 

AGGCATTTAT 

GGAGCCACTG 

TTTGTGGTGA 

GCAGTGTTTG 

AAGGATGAAT 

GCCAAATACC 

CTCCTTGCAG 

ACTTTGGCCT 

CTCTTTGGAG 

CAGAAGGACC 

AACCTCTCTG 

CAGCTCTACC 

TTTGAGGAGT 

CTACAGTTCT 

AAGGGAACCC 

CTGCGAGGAT 

TTCAAGGAGA 

CTCTTCACTG 

CTGGGTCTCT 

ATGTGTGAGG 

ACTGCAAGCA 



11 
I 

AAGGACCCTA 

GATATGACCC 

ACCCGGTGGA 

TGGTGAAAGG 

ACTCATCTGA 

TGGGT CCTG A 

TGATGGACAT 

TCATTCACCA 

GACTGTGCAT 

GGGCCATCAA 

AAAACCTAGT 

TGTCAAGTGA 

TCCCGATCCT 

TCATCGGGAT 

ATTCAGCTTT 

AGTTTCTGAC 

CTATCCAAGA 

GTGGAAACTC 

GCCACATCCT 

TTAATGTAAT 

CGAATGTCTC 

TCACCCAACC 

AGCATGAAGC 

GCAAGAAACA 

GCCCAGAGGA 

GAAAGTTATG 

TTGGGAGAAT 

CTAGAAGGCT 

TGGGGAAGAT 

CTCTCCTAGG 

ACGTTTCACA 

AAAAGTATGA 

TGAGCAACCT 

GGGGGCAGAG 

TGCTGGACGA 

GCATTAAGAA 

TAGAGTCTTG 

ACAAGGAGTT 

TGCAGTTCAA 

GCCCTGCTGA 

TGTTCCTCTT 

GGT TGGACAA 

TCGGCGCGGT 

TGGTGT T CAT 



21 

] 

CCTTATCTCA 

CAGCCTGAAG 

TGATGCCGGG 

CTACCGGCAA 

CACCAATGCC 

GAAGGCCTCT 

CGTGGCCAAC 

AATCCTCCAG 

AGCCCTTTTT 

CTACCGCACG 

GTCCTTCAAG 

TAGCTATTCT 

AATGGTCTTT 

ATCAGTGTAT 

CCGAAGGTCA 

CTGCATCAGG 

TATAAGAAGG 

TGCCCTGGCC 

CCTGAGACGC 

GAAGTTTTCC 

TCTAAGGAGA 

AGAAGACCCA 

CAGCAGGAAA 

GAGGTCAGAG 

G C AAAGTG AC 

TCGTTATCCC 

CATCAGAGGA 

TCTTACTTGG 

CTTGGGAATA 

ACAGATGCAG 

GCAGGCATGG 

TCACCAAAGG 

CCCCTATGGA 

GCAGAGGATT 

CCCCCTGTCG 

GACG CTCAGG 

TGATGAAGTT 

AATGGAGGAG 

GGATCCTGAA 

GAGAGAGGAA 

CCTCCTGATG 

GGGCTCACGG 

GCTGGCAGAC 

GCTGGTGTTT 



31 
I 

GATCTGGACC 

ACCATGATCC 

CTACTCTCCT 

AGGCTGACCG 

AAAAGATTTC 

CTGAGCCACG 

ATCCTGTGCA 

CAGACTGAGA 

GCCACCGAGT 

GCCATCCGGT 

ACATTGACCC 

TTGTTTGAAG 

TGTGCGGCGT 

GTCATATTCA 

GCAATTTTGG 

CTGATCAAAA 

AGGGAAAGAA 

CCCATCGTGT 

AAACTCACCG 

ATTGCAATCT 

ATGAAGAAAA 

GATACTGTCT 

AGTACCCCAA 

GCATACAGTG 

AGCCTCAAAT 

GAAGCCCAGC 

TACAGGCCTC 

CCCCAAGAAG 

TGTGGGAATG 

CTGCAGAAAG 

ATCTTTCATG 

TATCAGCACA 

GACCTGACTG 

AGCCTGGCCC 

GCCGTGGACG 

GGAAAGACAG 

ATTTTATTAG 

AGAGGGCGCT 

CACCTTTACA 

GATGCTGGTA 

ATTGGCAGCG 

ATGACCTGTG 

ATCGGTCAGC 

GGCGT CACCA 



41 
I 

AGCGAGGCCG 

CAGTGCGACC 

TCGCCACATT 

TAGACACCCT 

GAGTCCTTTG 

TGGTGTGGAA 

TCATCATGGC 

GGACCTCTGG 

TTACCAAAGT 

TGAAGGTGGC 

ACATCTCTGT 

CTGCCTTGTT 

ACGCCTTTTT 

TACCCGTCCA 

TGACAGACAA 

TGTATGCCTG 

AATTACTGGA 

CCACCATAGC 

CACCCGTGGC 

TGCCCTTCTC 

TTCTCATAGA 

TGCTTTTAGC 

AGAAATTGCA 

AGAGGAGTCC 

CGGTTCTGCA 

TCCTGGCTTG 

ATGGATTTTC 

TGGATAGGAC 

TGGGAAGTGG 

GGGTGGTGGC 

GAAATGTGAG 

CAGTCCGCGT 

AGATTGGGGA 

GCGCTGTCTA 

CCCACGTGGG 

TCGTCCTGGT 

AAGATGGAGA 

ATGCAAAACT 

ATGCAGCAAT 

TAATCGGGTA 

CTGCCTTCAG 

GGCCCCAGGG 

ATGTGTACCA 

AAGGCTTCGT 



51 
1 

GCGGAGATCC 60 

CTGTGGAAGG 120 

TTCCTGGCTC 180 

GCCCCCATTG 240 

GGATGAAGAG 300 

ATTCCAGAGG 3 60 

AGCCATAGGG 420 

GAAAGTCTGG 480 

CTTCTTTTGG 540 

GCTCTCCACC 600 

TGGCGAGGTG 66 0 

TTGTCCTTTG 72 0 

CATTCTGGGG 780 

GATGTTTATG 840 

GCGAGTTCAG 900 

GGAGAAATCT 960 

AAAAGCTGGA 1020 

CATCGTGCTG 1080 

ATTTAGTGTG 1140 

CATCAAAGCA 120 0 

TAAAAGCCCC 12 60 

AAATGCCACC 132 0 

GAACCAGAAA 1380 

ACCAGCCAAG 1440 

CAGCATAAGC 150 0 

GAGGTGGCCA 1560 

TGCTAAAGAC 1620 

TCAAAGGGCA 1680 

AAAGAGCTCC 1740 

AGTCAATGGA 1800 

AGAAAACATA 1860 

CTGTGGCCTC 1920 

GCGGGGCCTC 1980 

CTCCGACCGT 2040 

GAAGCACGTC 2100 

GACCCACCAG 2160 

GATTTGTGAA 2220 

GATTCACAAC 2280 

GGTGGAAGCC 2 340 

CCTCCTTTCT 240 0 

CAACTGGTGG 2460 

CAACAGGACC 252 0 

GTGGGTGTAC 2 580 

CTTCACCAAG 2640 



380 



10 



15 



20 



WO 02/086443 

ACCACACTGA TGGCATCCTC 
CCAATGAGTT TCTTTGACAC 
ATGGACGAGC TGGATGTGAG 
ATGGTGGTGT TTATTCTCGT 
GCCAGCCTTG CTGTAGGCTT 
CTCAAGAAGG TGGAGAATGT 
CAGGGCCTGG G CATC ATT CA 
TCCAAAGGCC TGTCATTGTC 
CGAACGGGAA CAGAGACGCA 
TCGACCTGTG TTCCTGAATG 
CCCAGCTGTG GGGAG AT C AC 
CTTGTTCTCG ACAGCCTGAA 
AGAACAGGTT CCGGAAAGTC 
AGTGGCACAA TCTTTATTGA 
AC CAAG CTG A CTGTGATCCC 
TTGGATCCCT TTGAGAGTCA 
ATGAGAGACA CAATAATGAA 
GAAAACTTCT CAGTAGGGGA 
TCAAAGAT CA TTCTCCTTGA 
GTTCAGAACA CCATCAAAGA 
CTCAACACAG TTCTCAACTG 
TTTGACAAGC CTGAAGTCCT 
GCAGAAGTCA GATTGTAG 



PCT/US02/12476 



CTCTCTGCAT 
GACTCCCACT 
GCTGCCGTTT 
GATCTTGGCT 
CTTCATTCTG 
CAGCCGGTCA 
CGCCTATGGC 
AT ACATCAT C 
AGCCAAATTC 
CACTCATCCC 
CTTCAGAGAC 
CTTGAACATA 
ATCGTTAGGA 
TGAGGTGGAT 
ACAGGAT CCT 
CACCGATGAG 
ACT CCCAGAA 
ACGTCAGCTG 
TGAAGCCACC 
TGCCTTCAAG 
CGAT CACGTC 
TGCAGAGAAG 



GACACGGTGT 
GGCAGGCTAA 
CACGCAGAGA 
GCTGTGTTTC 
TTACGCATTT 
CCCTGGTTCA 
AAGAAGGAGA 
CAGCTGAGCG 
ACCTCCGTGG 
CTCAAAGTGG 
TATCAGATGA 
CAAAGTGGGC 
ATGGCTTTGT 
ATCTGCATTC 
GTCCTGTTTG 
ATGCTCTGGC 
AAATTACAGG 
CTTTGTGTGG 
GCCTCTATGG 
GGCTGCACTG 
CTGGTTATGG 
CCAGATT CTG 



TTGATAAGAT 
TGAACCGTTT 
ACTTTCTGCA 
CTGCTGTCCT 
TCCACAGAGG 
CCCACATCAC 
GCTGCATCAC 
GACTGCTCCA 
AGCTGCTCAG 
GGACCTGTCC 
GATACAGAGA 
AGACAGTCGG 
TTCGTCTGGT 
TCAGCTTGGA 
TAGGTACAGT 
AGGTTCTGGA 
CAGAAGTCAC 
CCCGAGCTCT 
ACTCCAAGAC 
TGCTGACCAT 
AAAATGGGAA 
CATTTGCGAT 



CTTAAAGAGC 2700 

TTCCAAGGAT 2760 

GCAGTTTTTT 2820 

TTTAGTCGTG 2 880 

AGTCCAGGAG 2 940 

CTCCTCCATG 3000 

CTATACTTCA 3 0 60 

AGTGTGTGTG 3120 

GGAATACATT 3180 

CAAGGACTGG 3240 

CAACACCCCC 3 300 

GATTGTTGGA 3360 

GGAGCCAGCC 342 0 

AGACCTCAGA 3480 

AAGGTACAAC 3540 

GAGAACATTC 3600 

AGAAAATGGA 3660 

TCTCCGTAAT 3720 

TGACACCCTG 3 780 

CGCCCACCGC 3840 

GGTGATTGAG 3 900 

GTTACTAGCA 3 960 



25 



Seq ID NO: 513 Protein sequence 
Protein Accession #: Eos sequence 



30 



35 



40 



45 



50 



MVGEGPYLIS 
TPVMVKGYRQ 
TRVLMD I VAN 
ALAWAINYRT 
PATIPILMVF 
TMNEFLTCIR 
TLSCHILLRR 
PSYITQPEDP 
GATGPEEQSD 
KDESRRLLTW 
TLAYVSQQAW 
NLSGGQRQRI 
LQFLESCDEV 
FKESPAEREE 
MCEVGAVLAD 
PMSFFDTTPT 
ASLAVGFFIL 
SKGLSLSYII 
PSCGEITFRD 
SGTIFIDEVD 
MRDTIMKLPE 
VQNTIKDAFK 
AEVRL 



11 
I 

DLDQRGRRRS 
RLTVDTLPPL 
ILCIIMAAIG 
AIRLKVALST 
CAAYAFFILG 
LIKMYAWEKS 
KLTAPVAFSV 
DTVLLLANAT 
SLKSVLHSIS 
PQEVDRTQRA 
IFHGNVRENI 
SLARAVYSDR 
ILLEDGEICE 
DAGIIGYLLS 
IGQHVYQWVY 
GRLMNRFSKD 
LRIFHRGVQE 
QLSGLLQVCV 
YQMRYRDNTP 
ICILSLEDLR 
KLQAEVTENG 
GCTVLTIAHR 



21 
I 

FAERYDPSLK 
STYDSSDTNA 
PTVLIHQILQ 
LVFENLVSFK 
PTAIiIGISVY 
FTNTIQDIRR 
IAMFNVMKFS 
LTWEHEASRK 
FWRKLCRYP 
AKYLGKILGI 
LFGEKYDHQR 
QLYLLDDPLS 
KGTHKELMEE 
LFTVFLFLLM 
TASMVFMLVF 
MDELDVRLPF 
LKKVENVSRS 
RTGTETQAKF 
LVLDSLNLNI 
TKLTVIPQDP 
ENFSVGERQL 
LNTVLNCDHV 



31 



41 



51 



TMIPVRPCAR 
KRFRVLWDEE 
QTERTSGKVW 
TLTHISVGEV 
VIFIPVQMFM 
RERKLLEKAG 
IAILPFSIKA 
STPKKLQNQK 
EAQLLAWRWP 
CGNVGSGKSS 
YQHTVRVCGL 
AVDAHVGKHV 
RGRYAKLIHN 
IGSAAFSNWW 
GVTKGFVFTK 
HAENFLQQFF 
PWFTHITSSM 
TSVELLREYI 
QSGQTVGIVG 
VLFVGTVRYN 
LCVARALLRN 
LVMENGKVIE 



LAPNPVDDAG 
VARVGPEKAS 
VGIGLCIALF 
LNILSSDSYS 
AKLNSAFRRS 
FVQSGNSALA 
MAEANVSLRR 
RHLCKKQRSE 
AVFVGRIIRG 
LLAALLGQMQ 
QKDLSNLPYG 
FEECIKKTLR 
LRGLQFKDPE 
LGLWLDKGSR 
TTLMASSSLH 
MWFILVILA 
QGLGIIHAYG 
STCVPECTHP 
RTGSGKSSLG 
LDPFESHTDE 
SKIILLDEAT 
FDKPEVLAEK 



LLSFATFSWL 60 

LSHWWKFQR 120 

ATEFTKVFFW 180 

LFEAALFCPL 240 

AILVTDKRVQ 3 00 

PIVSTIAIVL 3 60 

MKKILIDKSP 420 

AYSERSPPAK 480 

YRPHGFSAKD 540 

LQKGWAVNG 60 0 

DLTEIGERGL 660 

GKTWLVTHQ 72 0 

HLYNAAMVEA 780 

MTCGPQGNRT 840 

DTVFDKILKS 900 

AVFPAVLLW 960 

KKESCITYTS 1020 

LKVGTCPKDW 1080 

MALFRLVEPA 1140 

MLWQVLERTF 120 0 

ASMDSKTDTL 12 60 

PDSAFAMLLA 132 0 



55 



Seq ID NO: 514 DNA sequence 
Nucleic Acid Accession #: Z31560 
Coding sequence: 1-966 



60 



65 



70 



75 



CACAGCGCCC 
ACTTCGGGGG 
AGCCCGGACC 
CGCAAGATGG 
GCCGAGTGGA 
CTGCGAGCGC 
AAGACGCTCA 
AAT AG CAT GG 
ATGGACAGTT 
CAGCTGGGCT 
ATGCACCGCT 
ATGAACGGCT 
CTTGGCTCCA 
TCTTCCTCCC 
TATCTCCCCG 
CACTACCAGA 
ATGTGAGGGC 
TGGGAGGGGT 
AAAAA 



11 
I 

GCATGTACAA 
GCGGCGGCGG 
GCGTCAAGCG 
CCCAGGAGAA 
AACTTTTGTC 
TGCACATGAA 
TGAAGAAGGA 
CGAGCGGGGT 
ACGCGCACAT 
ACCCGCAGCA 
ACGACGTGAG 
CGCCCACCTA 
TGGGTTCGGT 
ACTCCAGGGC 
GCGCCGAGGT 
GCGGCCCGGT 
CGGACAGCGA 
GCAAAAGAGG 



21 
I 

CATGATGGAG 
CAACTCCACC 
GCCCATGAAT 
CCCCAAGATG 
GGAGACGGAG 
GGAGCACCCG 
TAAGTACACG 
CGGGGTGGGC 
GAACGGCTGG 
CCCGGGCCTC 
CGCCCTGCAG 
CAGCATGTCC 
GGT CAAGTCC 
GCCCTGCCAG 
GCCGGAACCC 
GCCCGGCACG 
ACTGGAGGGG 
AGAGTAAGAA 



31 
! 

ACGGAGCTGA 
GCGGCGGCGG 
GCCTTCATGG 
CACAACT CGG 
AAGCGGCCGT 
GATTATAAAT 
CTGCCCGGCG 
GCCGGCCTGG 
AGCAACGGCA 
AATG CGCACG 
TACAACTCCA 
TACTCGCAGC 
GAGGCCAGCT 
GCCGGGGACC 
GCCGCCCCCA 
GCCATTAACG 
GGAGAAATTT 
ACAGCATGGA 



41 
I 

AGCCGCCGGG 
CCGGCGGCAA 
TGTGGTCCCG 
AGAT CAGCAA 
TCATCGACGA 
ACCGGCCCCG 
GGCTGCTGGC 
GCGCGGGCGT 
GCTACAGCAT 
GCGCAGCGCA 
TGACCAGCTC 
AGGGCACCCC 
CCAGCCCCCC 
TCCGGGACAT 
GCAGACTTCA 
GCACACTGCC 
TCAAAGAAAA 
GAAAACCCGG 



51 
! 

CCCGCAGCAA 60 

CCAGAAAAAC 12 0 

CGGGCAGCGG 180 

GCGCCTGGGC 240 

GGCTAAGCGG 3 00 

GCGGAAAACC 3 60 

CCCCGGCGGC 42 0 

GAACCAGCGC 480 

GATGCAGGAC 540 

GATGCAGCCC 600 

GCAGACCTAC 660 

TGGCATGGCT 72 0 

TGTGGTTACC 780 

GATCAGCATG 840 

CATGT CCCAG 90 0 

CCTCTCACAC 960 

ACGAGGGAAA 102 0 

TACGCTCAAA 1080 



80 



Seq ID NO: 515 Protein sequence 
Protein Accession #: CAA83435 



1 11 21 31 41 51 

BC I I I 1 1 1 

OJ HSARMYNMME TELKPPGPQQ TSGGGGGNST AAAAGGNQKN SPDRVKRPMN AFMVWSRGQR 60 

RKMAQENPKM HNSEISKRLG AEWKLLSETE KRPFIDEAKR LRALHMKEHP DYKYRPRRKT 120 
KTLMKKDKYT LPGGLLAPGG NSMASGVGVG AGLGAGVNQR MDSYAHMNGW SNGSYSMMQD 180 



381 



10 



15 



20 



25 



WO 02/086443 

QLGYPQHPGL NAHGAAQMQP MHRYDVSALQ YNSMTSSQTY MNGSPTYSMS YSQQGTPGMA 
LGSMGSWKS EASSSPPWT SSSHSRAPCQ AGDLRDMISM YLPGAEVPEP AAPSRLHMSQ 
HYQSGPVPGT AINGTLPLSH M 

Seq ID NO: 516 DNA sequence 
Nucleic Acid Accession #: U91618 



PCT/US02/12476 



Coding sequence: 29..541



1 

I 

CGGACTTGGC 
CATGCTACTC 
AGCATTAGAA 
TCCCTCTTGG 
AGCTGAGGAA 
TGCTTTAGAT 
TCACAGCAGG 
TGACAAAAAT 
GCTGTATGAG 
AGAGAATAAA 
ATTATATTTG 
ATTGAATGTG 
T CTTCAAAAA 



11 



21 



I 



i 



TTGTTAGAAG 
CTGGCTTTCA 
GCAGATTTCT 
AAGATGACTC 
ACAGGAGAAG 
GGCTTTAGCT 
GCTTTTCAAC 
GGAAAGGAAG 
AATAAACCCA 
TCATTTATTT 
TGTGAAAATG 
TTTTTCTGCA 
AAAAAAAAAA 



GCTGAAAGAT 
GCTCCTGGAG 
TGACCAATAT 
TGCTAAATGT 
TTCATGAAGA 
TGGAAGCAAT 
ACTGGGAGTT 
AAGT CAT AAA 
GAAGACCCTA 
ACATGTGATT 
TGACAAACAC 
CTAATAGAAA 
AAATGGGGCC 



31 
I 

GATGGCAGGA 
TCTGTGCTCA 
GCATACATCA 
TTGCAGTCTT 
GGAGCTTGTT 
GTTGACAATA 
AAT CCAGGAA 
GAGAAAAATT 
CATACTCAAA 
GTG ATT CATC 
ACTTATCTGT 
TTAGACTAAG 
GCAATT 



41 
I 

ATGAAAATCC 
GATTCAGAAG 
AAGATTAGTA 
GTAAATAATT 
GCAAGAAGGA 
TACCAGCTCC 
GATATTCTTG 
CCTTATATTC 
AGAGATTCTT 
ATCCCTTAAT 
CTCTTCTACA 
TGTTTTCAAA 



51 
I 

AGCTTGTATG 
AGGAAATGAA 
AAGCACATGT 
TGAACAGCCC 
AACTTCCTAC 
ACAAAATCTG 
ATACTGGAAA 
TGAAACGGCA 
ACTATTACTG 
TAAATAT CAA 
ATTGTGGTTT 
TAAATCTAAA 



Seq ID NO: 517 Protein sequence 
Protein Accession #: AAB50564 



240 
300 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
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35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



1 11 21 31 41 SI 

I I I I I I 

MMAGMKIQLV CMLLLAFSSW SLCSDSEEEM KALEADFLTN MHTSKISKAH VPSWKMTLLN 

VCSLVNNLNS PAEETGEVHE EELVARRKLP TALDGFSLEA MLTIYQLHKI CHSRAFQHWE 

LIQEDILDTG NDKNGKEEVI KRKIPYILKR QLYENKPRRP YILKRDSYYY 

Seq ID NO: 518 DNA sequence 

Nucleic Acid Accession #: NM_006536.2 

Coding sequence: 109..2940



60 
120 



11 



I 



I 



85 



ACCTAAAACC 
ATGTATGCAG 
AGCATTGCAG 
GAACTCCCAT 
ATTGCAATTA 
ATAACTGAAG 
AT AAAGAT T T 
TCATATGAAA 
TACACCCTAC 
TTCCTACTGA 
GAATGGGCCC 
ATAAATGGGC 
GTGTGTGAAA 
GGATGCACCT 
AGTTTATCTT 
CTACAGAACC 
TTTCACCACA 
GTACAGGCTG 
GCTGACAGAC 
ATTCATACCT 
CACCAAATTA 
TCAGCTAAAA 
AAACTGAATG 
CTTCTTGGCA 
CTGGGTTCAT 
TTCTTTGTTC 
T CTGGAACTG 
AAACCTCACC 
ATGTTTCTAG 
GGACGAAAAT 
TGGATTCCAG 
TCTCTGCAAG 
GCCACTGTGG 
TATGCCAATG 
GAG CCAG AG A 
GTTATAAAAA 
TATAGCTTGA 
CCAGGGAGTC 
GCTCCAAGGA 
AGCTCAGGAG 
CCACCATGCA 
TGGACAGCAC 
AGTAAAAGTC 
AAGCGAAATC 
ACGAATGGAC 
GCAATACGAG 
CCTCTGTTTA 
GGAGTTTTAA 



TTGCAAGTTC 
CAGGCT CAGT 
GTCCTATTTG 
TCCTGGGAGC 
ATCCTCAGGT 
CTTCATTTTA 
TAATACCTGC 
AGGCAAATGT 
AATACAGAGG 
ATGATAACTT 
ACCTCCGTTG 
AAAATCAAAT 
AAGGTCCTTG 
TTATCTACAA 
CTGTGGTTGA 
AGATGTGCAG 
GCTTTCCCAT 
GTGACAAAGT 
TCCTTCAACT 
TCGTGGGCAT 
ACAGCAATGA 
CAGAC AT CAG 
GAAAAGCTTA 
ATTGCTTACC 
CTGCAGCCCC 
CAGATATATC 
GAGACATTTT 
ATCAATTGAA 
TTACGTGGCA 
ACTACACAAA 
GAACAGCTAA 
CCCTGAAAGT 
AAGCCTTTGT 
TGAAACAGGG 
CTGGAGATCC 
ATGATGGAAT 
AAGTGCATGT 
ATGCTATGTA 
AATCAGTAGG 
GCTCCTTTTC 
AAATTATTGA 
CTGGAGAAGA 
TACAGAATAT 
CTCAGCAAGC 
CTGAACATCA 
CAATGGATAG 
TTCCCCCCAA 
CAGCAATGGG 



21 
I 

AGGAAGAAAC 
GTGAGTGAAC 
CAACCTGAAG 
TGGAGTACAG 
ACCTGAGAAT 
CCTATTTAAT 
CACATGGAAA 
CATAGTGACT 
GTGTGGAAAA 
AACAGCTGGC 
GGGTGTGTTC 
TAAAGTGACA 
CCCCCAAGAA 
TAGCACCCAA 
ATTTTGTAAT 
CCTCAGAAGT 
GAATGGGACT 
GGTCTGTTTA 
ACAACAAGCC 
TGCCAGTTTC 
TG AT CGAAAG 
CATTTGTTCA 
TGGCTCTGTG 
CACTGTGCTC 
AAAT CTGG AG 
AAACTCCAAT 
C CAG CAA CAT 
AAACACAGTG 
GGCCAGTGGT 
TAATTTTATC 
GCCTGGGCAC 
GACAGTGACC 
GGAAAGAGAC 
ATTTTATCCC 
TGTTACGCTG 
TTACTCGAGG 
CAATCACTCT 
TGTACCAGGT 
CAGAAATGAG 
AGTGCTGGGA 
CCTGGAAGCT 
CTTTGATCAG 
CCAAGATGAC 
TGGCATCAGG 
GCCAAATGGA 
GAACTCCTTA 
TTCTGATCCT 
TTTGATAGGA 



31 
I 

CATCTGCATC 
TGGAGGCTTC 
TTTGTGACTC 
CTTCAAGACA 
CAGAACCTCA 
GCTACCAAGA 
GCTAATAATA 
GACTGGTATG 
GAGGGAAAAT 
TACGGATCAC 
GATGAGTATA 
AGGTGTT CAT 
AACTGTATTA 
AATGCAACTG 
GCAAGTACCC 
GCATGGGATG 
GAGCTTCCAC 
GTGCTGGATG 
GCAGAATTTT 
GACAGCAAAG 
TTGCTGGTTT 
GGGCTTAAGA 
ATGATATTAG 
AGCAGTGGTT 
GAAT TATCAC 
AGCATGATTG 
ATTCAGCTTG 
ACTGTGGATA 
CCTCCTGAGA 
ACCAATCTAA 
TGGACTTACA 
TCTCGCGCCT 
AGCCTCCATT 
ATTCTTAATG 
AGACTCCTTG 
TATTTTTTCT 
CCCAGCATAA 
TACACAGCAA 
GAGGAGCGAA 
GTTCCAGCTG 
GTAAAAGTAG 
GGCCAGGCTA 
TTTAACAATG 
GAGATATTTA 
GAAACACATG 
CAGTCTGCTG 
GTACCTGCCA 
ATCATTTGCC 



41 
I 

CATATTGAAA 
TCTACAACAT 
TCCTGGTTGC 
ATGGGTATAA 
TCTCAAACAT 
GAAGAGTATT 
ACAGCAAAAT 
GGGCACATGG 
ACATTCATTT 
GAGGCCGAGT 
ACAATGACAA 
CTGACATCAC 
TTAGTAAGCT 
CATC AAT AAT 
ACAACCAAGA 
TAATCACAGA 
CTCCTCCCAC 
TGT CCAGCAA 
ATTTGATGCA 
GAGAGATCAG 
CATATCTGCC 
AAGGATTTGA 
TGACCAGCGG 
CAACAATTCA 
GTCTTACAGG 
ATGCTTTCAG 
AAAGTACAGG 
ATACTGTGGG 
TTATATTATT 
CTTTTCGGAC 
CCCTGAACAA 
CCAACTCAGC 
TTCCTCATCC 
CCACTGTCAC 
ATGATGGAGC 
CCTTTGCTGC 
GCACCCCAGC 
ACGGTAATAT 
AGTGGGGCTT 
GCCCCCACCC 
AAGAGGAATT 
CAAGCTATGA 
CTATTTTAGT 
CGTTCTCACC 
AAAGCCACAG 
TATCTAACAT 
GAGATTATCT 
TTATTATAGT 



51 
I 

ACCTGACACA 
GACCCAAAGG 
CTTAAGTTCA 
TGGATTGCTC 
TAAGGAAATG 
TTTCAGAAAT 
AAAACAAGAA 
AGATGATCCA 
CACACCTAAT 
GTTTGTCCAT 
ACCTTTCTAC 
AGGCATTTTT 
TTTTAAAGAA 
GTTCATGCAA 
AGCACCAAAC 
CTCTGCTGAC 
ATTCTCGCTT 
GATGGCAGAG 
GATTGTTGAA 
AGCCCAGCTA 
CACCACTGTA 
GGTGGTTGAA 
AGATGATAAG 
CTCCATTGCC 
AGGTTTAAAG 
TAG AAT T T C C 
TGAAAATGT C 
CAACGACACT 
TGATCCTGAT 
AGCTAGTCTT 
TACCCATCAT 
TGTGCCCCCA 
TGTGATGATT 
TGCCACAGTT 
AGGTGCTGAT 
AAATGGTAGA 
CCACTCTATT 
TCAGATGAAT 
TAGCCGAGTC 
TGATGTGTTT 
GACCCTATCT 
AATAAGAATG 
AAAT ACAT CA 
CCAGATTTCC 
AATTTATGTT 
TGCCCAGGCG 
TATATTGAAA 
TGTGACACAT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
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10 



15 



25 



30 



WO 02/086443 

CATACTTTAA GCAGGAAAAA 
ATAAATATCC AAAGTGTCTT 
CATACTAACA AAGTCAAATT 
ATACAGATAA GATTTTTACA 
CCTTACACTT TGGCTATGAA 
GCAAAGGGAA GGGTAAAGTC 
AATAGCCCCA AG CAG AGAAA 
TCATTTAGTT ACTTTGATTA 
TTTACATGAA GATCATGCTA 
CTTGCTATTT TGTTATATAT 
TTTCACTGTA AGAGGTAACC 
TTTATGACAA AGGTCTATTG 
TTTCTAAGTT TATTGCCTTG 
TACCTAGGAA A 



PCT/US02/12476 



GAGAGCAGAC 
CCTT CTTAGA 
AACATCAAAA 
TGGT AG AT CA 
CAAATAATAA 
GGACCAGTGT 
AGGAGGGTAG 
ATTTTTCTTT 
TATTTTATAT 
ATTT CAGATG 
TTTAACAATA 
AATTTATTTG 
GGTTATTATG 



AAGAAAGAGA 
TATAAGACCC 
CTGTATTAAA 
ACAATTCTTT 
AAATTATTCT 
CAAGGAAAGT 
GTCTGCATTA 
TCTCCTTATC 
ATGTAGCCCC 
ACATCTCCCT 
TGGGTATTAC 
TNTGTAAGTT 
GAATGATAGT 



ATGGAACAAA 
ATGGCCTTCG 
ATGCATTGAG 
TTGGGGGTAG 
TTAAAGTAAT 
TTGTTTTATT 
TAACTGTCTG 
TGTGCAGTAC 
TAATGCAAAG 
GCTAATGCTC 
CTTTGTCTCT 
TCTACTCCCA 
TATAGCCCCN 



ATTATTATAA 
ACTACAAAAA 
TTTTTGTACA 
ATTAGAAAAC 
GTCTTTAAAG 
GAGGTGGAAA 
TGTGAAGCAA 
AGGTTGCTTG 
CTCTTTACCT 
AGAGATCTTT 
TCATACCGGT 
TCAAAGCAGC 
TATAATGCCT 



Seq ID NO: 519 Protein sequence 
Protein Accession #: NP_006527.1 



20 | 



ii 



35 



MTQRSIAGPI 
IKEMITEASF 
GDDPYTLQYR 
KPFYINGQNQ 
MFMQSLSSW 
TFSLVQAGDK 
RAQLHQINSN 
GDDKLLGNCL 
SRISSGTGDI 
FDPDGRKYYT 
AVPPATVEAF 
AGADVI KNDG 
IQMNAPRKSV 
LTLSWTAPGE 
PQISTNGPEH 
h I LKGVLT AM 



CNLKFVTIjLV 
YLFNATKRRV 
GCGKEGKYIH 
IKVTRCSSDI 
EFCNASTHNQ 
WCLVLDVSS 
DDRKLLVSYL 
PTVLSSGSTI 
FQQHIQLEST 
NNF I TNIiTFR 
VERDSLHFPH 
I YSRYFFSFA 
GRNEEERKWG 
DFDQGQATSY 
QPNGETHESH 
GLIGIICLII 



21 
I 

ALSSELPFLG 
FFRNIKILIP 
FTPNFLLNDN 
TGIFVCEKGP 
EAPNLQNQMC 
KMAEADRLLQ 
PTTVSAKTDI 
HSIALGSSAA 
GENVKPHHQL 
TASLWIPGTA 
PVMIYANVKQ 
ANGRYSLKVH 
FSRVSSGGSF 
EIRMSKSLQN 
RIYVAIRAMD 
WTHHTLSRK 



31 



41 



AGVQLQDNGY 
ATWKANNNSK 
LTAGYGSRGR 
CPQENCIISK 
SLRSAWDVIT 
LQQAAEFYLM 
SICSGLKKGF 
PNLEELSRLT 
KNTVTVDNTV 
KPGHWTYTLN 
GFYPILNATV 
VNHSPSISTP 
SVLGVPAGPH 
IQDDFNNAIL 
RNSLQSAVSN 
KRADKKENGT 



NGLLIAINPQ 
IKQESYEKAN 
VFVHEWAHLR 
LFKEGCTFIY 
DSADFHHSFP 
QIVEIHTFVG 
EWEKLNGKA 
GGLKFFVPDI 
GNDTMFLVTW 
NTHHSLQALK 
TATVEPETGD 
AHSIPGSHAM 
PDVFPPCKII 
VNTSKRNPQQ 
IAQAPLFIPP 



51 
I 

VPENQNLISN 
V I VTDWYGAH 
WGVFDEYNND 
NSTQNATASI 
MNGTELPPPP 
IASFDSKGEI 
YGSVMILVTS 
SNSNSMIDAF 
QASGPPEIIIi 
VTVTSRASNS 
PVTLRLLDDG 
YVPGYTANGN 
DLEAVKVEEE 
AGIREIFTFS 
NSDPVPARDY 



2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
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720 
780 
840 
900 
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Seq ID NO: 520 DNA sequence 

Nucleic Acid Accession #: NM_000228.1 

Coding sequence: 82.. 3600 
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GCTTTCAGGC 
GGATCACCCC 
CTCCTGCATG 
CTTGTTGGGA 
ACCTACTGCA 
CCTCACAACT 
TGGTGGCAGT 
TTCCAGCTTC 
GAGCGCTCCT 
ACCTCCACCT 
CAGTCCCTGC 
ATGGATTTAG 
ATCACAAACT 
CCTCCCAGCG 
GGCCATGCTG 
CAGGTCCACG 
GCACCCTTCT 
CAAAGGTGCG 
GCCAGCCAGG 
AACTGTGAGC 
GAGACCTGCA 
CCAGTGACCG 
AAGCCGGGCT 
AACATCCTGG 
CTGCCCAACG 
AGTGGCCAGG 
CAACCAGTTC 
GCAGCCATCC 
TGTGACTGTG 
CTCTGCCGCC 
CGCTACCCGG 
GAGCAGGCCC 
GGGCTGGAGG 
ATCCGAGCAG 
GCCATCCTCT 
GAGACGTTGT 
ACTATGTATC 
GCCTTCCGGA 
GACAGCTCGC 
CGGCAGGCGG 
ATGTCTTCGT 
ATGGCTTGCA 
TGTGGCTCCC 
CAGGTGGCTG 



11 

I 

GATCTGGAGA 
ATTGGCTGAA 
CCCAACAAGC 
GGACCCGGTT 
CCCAGTATGG 
ACTACAGTCA 
CCCAGAATGA 
AAGAAGT CAT 
CAGACTT CGG 
TCCCTCGGGT 
CTCAGAGGCC 
TGTCTGGGAT 
TGAGAGTCAA 
CCTACTATGC 
ATCGCTGCGC 
ATGTCTGTGT 
ACAACAACCG 
ACTGCAATGG 
GGGCATATGG 
GGTGTCAGCT 
TCTCCTGCGA 
GGCAGTGTGT 
TCACTGGACT 
GGTCCCGGAG 
TGGTGGGTCC 
GCTGTGAACC 
ACAGGGCAGT 
GCCAGTGTCC 
ATTTCCGGGG 
CTGGCTTGAC 
TGTGCGTGGC 
TGCGCTTTGG 
ACCGTGGCCT 
TTCTCAGCAG 
CCCTCAGGCG 
CCCTTCCGAG 
AGAGGAAGAG 
TGCTGAGCAC 
GCCTTTTGGA 
GAGGAGGAGG 
TGCCTGACCT 
CCCCAATATC 
GCTGCAGGGG 
AGCAGCTGCG 



21 
I 

AAGAACGGCA 
GATGAGACCA 
CTGCTCCCGT 
TCTCCGAGCT 
CGAGTGGCAG 
CCGAGTAGAG 
TGTGAACCCT 
GATGGAGTTC 
TAAGACCTGG 
CCGCCAGGGT 
TAATGCACGC 
TCCAGCAACT 
TTTCACCAGG 
TGTGTCCCAG 
ACCCAAGCCT 
CTGCCAGCAC 
GCCCTGGAGA 
GCACTCAGAG 
AGGTGTGTGT 
GCACTATTTC 
GTGTGATCCG 
GTGCAAGGAG 
CACCTACGCC 
GGACATGCCG 
CAAATGTGAC 
GTGTGCCTGC 
GCCCTGTCGG 
AGACCGGACC 
AACAGAGGGC 
CGGGCCCCGC 
CTGCCACCCT 
TAGACTCCGC 
GGCCTCCCGG 
CCCCGCAGTC 
AACTCTCCAG 
AGACCTGGAG 
GGAGCAGTTT 
AGCCTACGAG 
CCAGCTCAGG 
AGGCACCGGC 
GACACCCACC 
ATGCCCTGGT 
TGTCCTTCCC 
GGGCTTCAAT 



31 
I 

GAACACACAG 
TTCTTCCTCT 
GGGGCCTGCT 
TCATCTACCT 
ATGAAATGCT 
AATGTGGCTT 
GTCTCTCTGC 
CAGGGGCCCA 
CGAGTGTACC 
CGGCCTCAGA 
CTAAATGGGG 
CAAAGTCAAA 
CTGGCCCCTG 
CTCCGTCTGC 
GGGGCCTCTG 
AACACTGCCG 
CCGGCGGAGG 
ACATGTCACT 
GACAATTGCC 
CGGAACCGGC 
GATGGGGCAG 
CATGTGCAGG 
AACCCGCAGG 
TGTGACGAGG 
CAGTGTGCTC 
GACCCGCACA 
GAAGGCTTTG 
TATGGAGACG 
CCGGGCTGCG 
TGTGACCAGT 
TGCTTCCAGA 
AATGCCACCG 
ATCCTAGATG 
ACAGAGCAGG 
GGCCTGCAGC 
AGTCTTGACA 
GAAAAAATAA 
CAGTCAGCCC 
GACAGCCGGA 
AGCCCCAAGC 
TTCAACAAGC 
GAGCTATGTC 
AGGGCCGGTG 
GCCCAGCTCC 



41 

I 

CAAGGAAAGG 
TGTGTTTTGC 
ATCCACCTGT 
GTGGACTGAC 
GCAAGTGTGA 
CATCCTCCGG 
AGCTGGACCT 
TGCCCGCCGG 
AGTACCTGGC 
GCTGGCAGGA 
GGAAGGTCCA 
AAATTCAAGA 
TGCCCCAAAG 
AGGGGAGCTG 
CAGGCCCCTC 
GCCCAAATTG 
GCCAGGACGC 
TTGACCCCGC 
GGGACCACAC 
GCCCGGGAGC 
TGCCAGGGGC 
GAGAGCGCTG 
GCTGCCACCG 
AGAGTGGGCG 
CCTACCACTG 
ACTCCCCTCA 
GTGGCCTGAT 
TGGCCACAGG 
ACAAGGCATC 
GCCAGCGAGG 
CCTATGATGC 
CCAGCCTGTG 
CAAAGAGTAA 
AGGTGGCTCA 
TGGATCTGCC 
GAAGCTTCAA 
GCAGTGCTGA 
AGGCTGCTCA 
GAGAGGCAGA 
TTGTGGCCCT 
TCTGTGGCAA 
CCCAAGACAA 
GGGCCTTCTT 
AGCGGACCAG 



51 
I 

TCCTTTCTGG 60 

CCTGCCTGGC 120 

TGGGGACCTG 180 

CAAGCCTGAG 240 

CTCCAGGCAG 3 00 

CCCCATGCGC 3 60 

GGACAGGAGA 420 

CATGCTGATT 480 

TGCCGACTGC 54 0 

TGTTCGGTGC 60 0 

ACTTAACCTT 660 

GGTGGGGGAG 72 0 

GGGCTACCAC 780 

CTTCTGTCAC 840 

CACCGCTGTG 900 

TGAGCGCTGT 960 

CCATGAATGC 102 0 

TGTGTTTGCC 1080 

CGAAGGCAAG 1140 

TTCCATTCAG 1200 

TCCCTGTGAC 1260 

TGACCTATGC 1320 

CTGTGACTGC 13 80 

CTGCCTTTGT 1440 

GAAGCTGGCC 150 0 

GCCCACAGTG 1560 

GTGCAGCGCT 1620 

ATGCCGAGCC 1680 

AGGCCGCTGC 1740 

CTACTGCAAT 180 0 

GGACCTCCGG 1860 

GTCAGGGCCT 1920 

GATTGAGCAG 1980 

GGTGGCCAGT 2040 

CCTGGAGGAG 2100 

TGGTCTCCTT 2160 

TCCTTCAGGA 222 0 

GCAGGTCTCC 2280 

GAGGCTGGTG 2340 

GAGGCTGGAG 2400 

CTCCAGGCAG 2460 

TGGCACAGCC 2520 

GATGGCGGGG 2580 

GCAGATGATT 2 640 



383 



10 



15 



20 



WO 02/086443 

AGGGCAGCCG AGGAATCTGC 
GTGAGCGCCA GCCGCTCCCA 
CAGGTCCGGG ACTTCCTAAC 
GAGGCCGTGC TGGCCCTGTG 
GAGATCCAGG CCATTGCAGC 
CAGGACATTG CGCGTGCCCG 
CATGCAGTGG AGGGCCAGGT 
CTGCAGGAAG CTCAGGACAC 
AGGGTTGCTG AGGTTCAGCA 
AAGCAGCTGG GTGACTTCTG 
GGGGCAGAGG CAGTCCAGGC 
GCCCAAGAGG GATTTGAGAG 
CAGAGTT CCA TGCTGGGTGA 
GAGCTGTTTG GGGAGACCAT 
CTGCGGGGCA GCCAGGCCAT 
GTGGAGCAGA TCCGTGACCA 
TGCTACAGCT TCCAGCCCGT 
GATTGGGTTG GAATGCTTTC 
GACCACCCCT GGTGTGTAGC 
GGGACAGTTA CACTTGACAG 
CTCTCAAGTC AAGGAAGCTG 
GGAATCCTGG ACCAAGCACA 
AAAATCTTTG G 
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CTCACAGATT 
GATGGAGGAA 
AGACCCCGAC 
GCTGCCCACA 
CAGGCTCCCC 
CCGGTTGCAG 
GGAAGATGTG 
CATGCAAGGC 
GGTACTGCGG 
GACACGGATG 
CCAGCAGCTT 
AATAAAACAA 
GCAGGGTGCC 
GGAGATGATG 
CATGCTGCGC 
CATCAATGGG 
TGCCCCACTC 
CATCTCCAGG 
TAGTAAGATT 
ACAAAGATGG 
GGCTGGGCAG 
AAAACTTAAC 



CAATCCAGTG 
GATGTCAGAC 
ACTGATGCAG 
GACTCAGCTA 
AACGTGGACT 
GCTGAGGCTG 
GTTGGGAACC 
ACCAGCCGCT 
CCAGCAGAAA 
GAGGAGCTCC 
GCGGAAGGTG 
AAGTATGCTG 
CGGATCCAGA 
GACAGGATGA 
TCGGCGGACC 
CGCGTGCTCT 
ATCTGCCGCC 
AGACTTTCAT 
ACCCTGAGCT 
TGGAGATTGG 
TATCCCCCGC 
AAAAGTGATG 



CCCAGCGCTT 
GCACACGGCT 
CCACTATCCA 
CTGTTCTGCA 
TGGTGCTGTC 
AGGAAGCCAG 
TGCGGCAGGG 
CCCTTCGGCT 
AGCTGGTGAC 
GCCACCAAGC 
CCAGCGAGCA 
AGTTGAAGGA 
GTGTGAAGAC 
AAGACATGGA 
TGACAGGACT 
ACTATGCCAC 
TTTGCTTTTG 
GCAGCCTAAA 
GCAGCTGAGC 
CATGCCATTG 
CTTTAGTTCT 
TAAAAATGAA 



GGAGACCCAG 2 700 

CCTAAT CCAG 2 760 

GGAGGTCAGC 2820 

GAAGATGAAT 2 880 

CCAGACCAAG 2940 

GAGCCGAGCC 3 00 0 

GACAGTGGCA 3060 

TATCCAGGAC 312 0 

AAGCATGACC 3180 

CCGGCAGCAG 3240 

GGCATTGAGT 3300 

CCGGTTGGGT 3 360 

AGAGGCAGAG 3420 

GTTGGAGCTG 3480 

GGAGAAGCGT 3 540 

CTGCAAGTGA 3 600 

GTTGGGGGCA 3 660 

GTACAGCCTG 372 0 

CTGAGCCAAT 3780 

AAACTAAGAG 3840 

CCACTGGGGA 3 900 

AAGC CAAAT A 3 960 
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Seq ID NO: 521 Protein sequence 
Protein Accession #: NP_000219.1 
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MRPFFLLCFA 
EWQMKCCKCD 
MEFQGPMPAG 
NARIiNGGKVQ 
VSQLRLQGSC 
PWRPAEGQDA 
HYFRNRRPGA 
TYANPQGCHR 
CACDPHNSPQ 
TEGPGCDKAS 
RLRNATASLW 
TLQGLQLDLP 
AYEQSAQAAQ 
TPTFNKLCGN 
GFNAQLQRTR 
DPDTDAATIQ 
RLQAEAEEAR 
VLRPAEKLVT 
IKQKYAEIiKD 
MLRSADLTGL 



11 



LPGLLHAQQA 
SRQPHNYYSH 
MLIERSSDFG 
LNLMDLVSGI 
FCHGHADRCA 
HECQRCDCNG 
SIQETCISCE 
CDCNILGSRR 
PTVQPVHRAV 
GRCLCRPGLT 
SGPGLEDRGL 
LEEETLSLPR 
QVSDSSRLLD 
SRQMACTPIS 
QMIRAAEESA 
EVSEAVLALW 
SRAHAVEGQV 
SMTKQLGDFW 
RLGQSSMLGE 
EKRVEQ I RDH 



21 
I 

CSRGACYPPV 
RVENVASSSG 
KTWRVYQYLA 
PATQSQKIQE 
PKPGASAGPS 
HSETCHFDPA 
CDPDGAVPGA 
DMPCDEESGR 
PCREGFGGLM 
GPRCDQCQRG 
ASRILDAKSK 
DLESLDRSFN 
QLRDSRREAE 
CPGELCPQDN 
SQIQSSAQRL 
LPTDSATVLQ 
EDWGNLRQG 
TRMEELRHQA 
QGARIQSVKT 
INGRVLYYAT 



31 
I 

GDLLVGRTRF 
PMRWWQSQND 
ADCTSTFPRV 
VGEITNLRVN 
TAVQVHDVCV 
VFAASQGAYG 
PCDPVTGQCV 
CLCLPNWGP 
CSAAAIRQCP 
YCNRYPVCVA 
IEQIRAVLSS 
GLLTMYQRKR 
RLVRQAGGGG 
GTACGSRCRG 
ETQVSASRSQ 
KMNEIQAIAA 
TVALQEAQDT 
RQQGAEAVQA 
EAEELFGETM 
CK 



41 



51 



LRASSTCGLT 
VNPVSLQLDL 
RQGRPQSWQD 
FTRLAPVPQR 
CQHNTAGPNC 
GVCDNCRDHT 
CKEHVQGERC 
KCDQCAPYHW 
DRTYGDVATG 
CHPCFQTYDA 
PAVTEQEVAQ 
EQFEKISSAD 
GTGSPKLVAL 
VLPRAGGAFL 
MEEDVRRTRL 
RLPNVDLVLS 
MQGTSRSLRL 
QQLAEGASEQ 
EMMDRMKDME 



KPETYCTQYG 
DRRFQLQEVM 
VRCQSLPQRP 
GYHPPSAYYA 
ERCAPFYNNR 
EGKNCERCQL 
DLCKPGFTGL 
KLASGQGCEP 
CRACDCDFRG 
DLREQALRFG 
VASAILSLRR 
PSGAFRMLST 
RLEMSSLPDL 
MAGQVAEQLR 
IjIQQVRDFLT 
QTKQDIARAR 
IQDRVAEVQQ 
ALSAQEGFER 
LELLRGSQAI 



Seq ID NO: 522 DNA sequence 

Nucleic Acid Accession #: NM_001944.1 

Coding sequence: 84.. 3083 



85 



TTTTCTTAGA 
TTTCACCAGG 
CCATCTTCGT 
ATGATGAAGA 
AATTTGCCAA 
TTACTTCAGA 
ATCAGCCGCC 
CTATAGTCGA 
AAGGACTAGA 
ATCCTCCAGT 
ACTCACTGGT 
AAATTGCCTT 
GAAACACTGG 
ATCGT CTGGT 
GTAATATTAA 
CAGCACGTAT 
TGGATGAAGA 
GAAATTGGTT 
AGGCTCTAGA 
CTGAATTTCA 
AGGTAATAAA 
AAAAAGGCAT 
ATGAGGACAC 
GATACCTAAT 
ATTCTACTTT 
CGGGTAAAAC 
CAACAGCTGT 
CTAGAACACT 
TAAAGTTGCC 
CCCAGGAACA 
ACAAT CGGTG 



11 

I 

CATTAACTGC 
GAAATCAGAG 
GGTGGTCATA 
AGAGATGACT 
ACCCTGCAGA 
TTACCAAGCA 
TTTTGGAATC 
CCGGGAGGAA 
TGTAGAGAAA 
ATTTTCACAA 
GATGATACTA 
CAAAATTGTC 
GGAAGTCCGT 
TGTGAGTGGT 
AGTGAAAGAT 
TGAAGAAAAT 
GTACACAGAT 
TGAAATACAA 
TTATGAACAA 
CCAATCAGTT 
TGTAAGAGAA 
AAGTAGCAAA 
TAACAAAGCT 
GATTGATTCA 
CATAGTTAAC 
TTCTACAGGC 
CCTCGAAAAA 
GAATAATAGA 
TGCCGTATGG 
GATACCTCCT 
TGAGATGCCA 



21 
I 

AGACGGCTGG 
ACAATGATGG 
TTGGTTCATG 
ATGCAACAAG 
GAAGGAGAAG 
ACCCAGAAAA 
TTTGTTGTTG 
ACTCCAAGCT 
CCACTTATAC 
CAAATTT TCA 
AATGCCACAG 
TCTCAGGAAC 
ACTTTGACCA 
GCAGACAAAG 
GTCAACGATA 
ATTTTAAGTT 
AATTGGCTTG 
ACTGATCCTA 
CTACAAAGCG 
ATCTCTCGAT 
GGAATTGCAT 
AAATTGGTGG 
GCCTCAAATG 
AAAACTGCTG 
AAAACAATCA 
ACGGTATATG 
GATGCAGTTT 
TACACTGGCC 
AGTATCACAA 
GGAGTATACC 
CGCAGCTTGA 



31 
I 

CAGGATAGAA 
GGCTCTTCCC 
GAGAATTGCG 
CTAAAAGAAG 
ATAACTCAAA 
TCACCTACCG 
ACAAAAACAC 
TCCTGATCAC 
TAACGGTTAA 
TGGGTGAAAT 
ATGCAGATGA 
CAGCAGGCAC 
ATTCTCTTGA 
ATGGAGAAGG 
ACTTCCCAAT 
CTGAATTACT 
CAGTATATTT 
GAACTAATGA 
TGAAACTTAG 
ACCGAGTTCA 
TCCGTCCTGC 
ATTATATCCT 
TCAAATATGT 
AAATCAAATT 
CAGCTGAGGT 
TTAGAGTACC 
GCAGTTCTTC 
CCTATACATT 
CCCTCAATGC 
ACATCTCCCT 
CACTGGAAGT 



41 
I 

GCAGCGGCTC 
CAGAACTACA 
AATAGAGACT 
GCAAAAACGT 
AAGAAACCCA 
AATCTCTGGA 
TGGAGATATT 
ATGTCGGGCT 
AATTTTGGAT 
TGAAGAAAAT 
ACCAAACCAC 
ACCCATGTTC 
CCGAGAGCAA 
ACTATCAACT 
GTTTAGAGAC 
TCGATTTCAA 
CTTTACCTCT 
AGGCATCCTG 
TATTGCTGTC 
GTCAACCCCA 
TTCCAAGACA 
GGGAACATAT 
CATGGGACGT 
TGTCAAAAAT 
TCTGGCCATA 
CGATTT CAAT 
ACCTTCCGTG 
TGCACTGGAA 
TACCTCGGCC 
GGTACTTACA 
CTGTCAGTGT 



51 
I 

ACTTGGACTT 
GGGGCTCTGG 
AAAGGTCAAT 
GAATGGGTGA 
ATTGCCAAGA 
GTGGGAATCG 
AACATAACAG 
CTAAATGCCC 
ATTAATGATA 
AGTGCCTCAA 
TTGAATTCTA 
CTCCTAAGCA 
GCTAGCAGCT 
CAATGTGAAT 
TCTCAGTATT 
GTAACAGATT 
GGGAATGAAG 
AAAGTGGTGA 
AAAAACAAAG 
GTCACAATTC 
TTTACTGTGC 
CAAGCCATCG 
AACGATGGTG 
ATGAACCGAG 
GATGAATACA 
GACAATTGTC 
GTTGTCTCCG 
GATCAACCTG 
CTCCTCAGAG 
GACAGTCAGA 
GACAACAGGG 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 



60 
* 120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 



384 
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GCATCTGTGG AACTTCTTAC CCAACCACAA GCCCTGGGAC CAGGTATGGC AGGCCGCACT 
CAGGGAGGCT GGGGCCTGCC GCCATCGGCC TGCTGCTCCT TGGTCTCCTG CTGCTGCTGT 
TGGCCCCCCT TCTGCTGTTG ACCTGTGACT GTGGGGCAGG TTCTACTGGG GGAGTGACAG 
GTGGTTTTAT CCCAGTTCCT GATGGCTCAG AAGGAACAAT TCATCAGTGG GGAATTGAAG 
GAGCCCATCC TGAAGACAAG GAAATCACAA ATATTTGTGT GCCTCCTGTA ACAGCCAATG 
GAGCCGATTT CATGGAAAGT TCTGAAGTTT GTACAAATAC GTATGCCAGA GGCACAGCGG 
TGGAAGGCAC TTCAGGAATG GAAATGACCA CTAAGCTTGG AGCAGCCACT GAATCTGGAG 
GTGCTGCAGG CTTTGCAACA GGGACAGTGT CAGGAGCTGC TTCAGGATTC GGAGCAGCCA 
CTGGAGTTGG CATCTGTTCC TCAGGGCAGT CTGGAACCAT GAGAACAAGG CATTCCACTG 
GAGGAACCAA TAAGGACTAC GCTGATGGGG CGATAAGCAT GAATTTTCTG GACTCCTACT 
TTTCTCAGAA AGCATTTGCC TGTGCGGAGG AAGACGATGG CCAGGAAGCA AATGACTGCT 
TGTTGATCTA TGATAATGAA GGCGCAGATG CCACTGGTTC TCCTGTGGGC TCCGTGGGTT 
GTTGCAGTTT TATTGCTGAT GACCTGGATG ACAGCTTCTT GGACTCACTT GGACCCAAAT 
TTAAAAAACT TG C AG AG AT A AGCCTTGGTG TTGATGGTGA AGGCAAAGAA GTTCAGCCAC 
CCTCTAAAGA CAGCGGTTAT GGGATTGAAT CCTGTGGCCA TCCCATAGAA GTCCAGCAGA 
CAGGATTTGT TAAGTGCCAG ACTTTGTCAG GAAGTCAAGG AGCTTCTGCT TTGT CCGCCT 
CTGGGTCTGT CCAGCCAGCT GTTTCCATCC CTGACCCTCT GCAGCATGGT AACTATTTAG 
TAACGGAGAC TTACTCGGCT TCTGGTTCCC TCGTGCAACC TTCCACTGCA GGCTTTGATC 
CACTTCTCAC ACAAAATGTG ATAGTGACAG AAAGGGTGAT CTGTCCGATT TCCAGTGTTC 
CTGGCAACCT AGCTGGCCCA ACGCAGCTAC GAGGGTCACA TACTATGCTC TGTACAGAGG 
ATCCTTGCTC CCGTCTAATA TGACCAGAAT GAGCTGGAAT ACCACACTGA CCAAATCTGG 
ATCTTTGGAC TAAAGTATTC AAAATAGCAT AGCAAAGCTC ACTGT AT TGG GCTAATAATT 
TGGCACTTAT TAGCTTCTCT CATAAACTGA TCACGATTAT AAAT TAAATG TTTGGGTTCA 
TACCCCAAAA GCAATATGTT GTCACTCCTA ATTCTCAAGT ACT AT T C AAA TTGTAGTAAA 
TCTTAAAGTT TTTCAAAACC CTAAAATCAT ATTCGC 

Seq ID NO: 523 Protein sequence 
Protein Accession #: NP_001935.1 

1 11 21 31 41 51 

| | | | | | 

MMGLFPRTTG alaifvwil vhgelrietk gqydeeemtm qqakrrqkre wvkfakpcre 

GEDNSKRNPI AKITSDYQAT QKITYRISGV GIDQPPFGIF WDKNTGD IN ITAIVDREET 
PSFLITCRAL NAQGLDVEKP LILTVKILDI NDNPPVFSQQ IFMGEIEENS ASNSLVMILN 
ATDADEPNHL NSKIAFKIVS QEPAGTPMFIj LSRNTGEVRT LTNSLDREQA SSYRLWSGA 
DKDGEGLSTQ CECNIKVKDV NDNFPMFRDS QYSARIEENI LSSELLRFQV TDLDEEYTDN 
WLAVYFFTSG NEGNWFEIQT DPRTNEGILK WKALDYEQL QSVKLSIAVK NKAEFHQSVI 
SRYRVQSTPV TIQVINVREG IAFRPASKTF TVQKGISSKK LVDYILGTYQ AIDEDTNKAA 
SNVKYVMGRN DGGYLMIDSK TAEIKFVKNM NRDSTFIVNK TITAEVLAID EYTGKTSTGT 
VYVRVPDFND NCPTAVLEKD AVCSSSPSW VSARTLNNRY TGPYTFALED QPVKLPAVWS 
ITTLNATSAL LRAQEQIPPG VYHISLVLTD SQNNRCEMPR SLTLEVCQCD NRGICGTSYP 
TTSPGTRYGR PHSGRLGPAA IGLLLLGLLIi LLLAPLLLLT CDCGAGSTGG VTGGFIPVPD 
GSEGTIHQWG I EGAHPEDKE ITNICVPPVT ANGADFMESS EVCTNTYARG TAVEGT SGME 
MTTKLGAATE SGGAAGFATG TVSGAASGFG AATGVGICSS GQSGTMRTRH STGGTNKDYA 
DGAI SMNFLD SYFSQKAFAC AEEDDGQEAN DCLLIYDNEG ADATGSPVGS VGCCSFIADD 
LDDSFLDSLG PKFKKLAEIS LGVDGEGKEV QPPSKDSGYG IESCGHPIEV QQTGFVKCQT 
LSGSQGASAL SASGSVQPAV SIPDPLQHGN YLVTETYSAS GSLVQPSTAG FDPLLTQNVI 
VTERVICPIS SVPGNLAGPT QLRGSHTMLC TEDPCSRLI 

Seq ID NO: 524 DNA sequence 

Nucleic Acid Accession #: XM_058069.2 

Coding sequence: 1.. 1413 

1 11 21 31 41 51 

| | | | | | 

ATGAAGTTTC TTCTAATACT GCTCCTGCAG GCCACTGCTT CTGGAGCTCT TCCCCTGAAC 
AGCTCTACAA GCCTGGAAAA AAATAATGTG CTATTTGGTG AAAGATACTT AGAAAAATTT 
TATGGCCTTG AGATAAACAA ACTTCCAGTG ACAAAAATGA AATATAGTGG AAACTTAATG 
AAGGAAAAAA TCCAAGAAAT GCAGCACTTC TTGGGTCTGA AAGTGACCGG GCAACTGGAC 
ACATCTACCC TGGAGATGAT GCACGCACCT CGATGTGGAG TCCCCGATGT CCATCATTTC 
AGGGAAATGC CAGGGGGGCC CGTATGGAGG AAACATTATA TCACCTACAG AATCAATAAT 
TACACACCTG ACATGAACCG TGAGGATGTT GACTACGCAA TCCGGAAAGC TTTCCAAGTA 
TGGAGTAATG TTACCCCCTT GAAATTCAGC AAGAT TAAC A CAGGCATGGC TGACATTTTG 
GTGGTTTTTG CCCGTGGAGC TCATGGAGAC TTCCATGCTT TTGATGGCAA AGGTGGAATC 
CTAGCCCATG CTTTTGGACC TGGATCTGGC AT TGG AGGGG ATGCACATTT CGATGAGGAC 
GAATTCTGGA CTACACATTC AGGAGGCACA AACTTGTTCC TCACTGCTGT TCACGAGATT 
GGCCATTCCT TAGGTCTTGG CCATTCTAGT GATCCAAAGG CCGTAATGTT CCCCACCTAC 
AAATATGTTG ACATCAACAC ATTTCGCCTC TCTGCTGATG ACATACGTGG CATTCAGTCC 
CTGTATGGAG ACCCAAAAGA GAACCAACGC TTGCCAAATC CTGACAATTC AGAACCAGCT 
CTCTGTGACC CCAATTTGAG TTTTGATGCT GTCACTACCG TGGGAAATAA GATCTTTTTC 
TTCAAAGACA GGTTCTTCTG GCTGAAGGTT TCTGAGAGAC CAAAGACCAG TGTTAATTTA 
ATTTCTTCCT TATGGCCAAC CTTGCCATCT GGCATTGAAG CTGCTTATGA AATTGAAGCC 
AGAAATCAAG TTTTTCTTTT TAAAGATGAC AAATACTGGT TAAT TAGCAA TTTAAGACCA 
GAGCCAAATT ATCCCAAGAG CATACATTCT TTTGGTTTTC CTAACTTTGT GAAAAAAATT 
GATGCAGCTG TTTTTAACCC ACGTTTTTAT AGGACCTACT TCTTTGTAGA TAACCAGTAT 
TGGAGGTATG ATGAAAGGAG ACAGATGATG GACCCTGGTT ATCCCAAACT GATTACCAAG 
AACTTCCAAG GAATCGGGCC TAAAATTGAT GCAGTCTTCT ACTCTAAAAA CAAATACTAC 
TATTTCTTCC AAGGATCTAA CCAATTTGAA TATGACTTCC TACT CCAACG TATCACCAAA 
ACACTGAAAA GCAATAG CTG GTTTGGTTGT TGA 

Seq ID NO: 525 Protein sequence 
Protein Accession #: P39900 

1 11 21 31 41 51 

l l l l l l 

MKFIjIjIIjLLQ ATASGALPLN SSTSLEKNNV LFGERYLEKF YGLEINKLPV TKMKYSGNLM 
KEKIQEMQHF LGLKVTGQLD TSTLEMMHAP RCGVPDVHHF REMPGGPVWR KHYITYRINN 
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YTPDMNREDV DYAIRKAFQV WSNVTPLKFS KINTGMADIL WPARGAHGD FHAFDGKGGI 180 

LAHAFGPGSG I GGDAHFDED EFWTTHSGGT NLFLTAVHEI GHSLGLGHSS DPKAVMFPTY 240 

KYVDINTFRL SADDIRGIQS LYGDPKENQR LPNPDNSEPA LCDPNLSFDA VTTVGNKIFF 300 

FKDRFFWLKV SERPKTSVNL ISSLWPTLPS GIEAAYEIEA RNQVFLFKDD KYWLISNLRP 3 60 

5 EPNYPKSIHS FGFPNFVKKI DAAVFNPRFY RTYFFVDNQY WRYDERRQMM DPGYPKLITK 420 

NFQGIGPKID AVFYSKNKYY YFFQGSNQFE YDFLLQRITK TLKSNSWFGC 

Seq ID NO: 526 DNA sequence 
Nucleic Acid Accession #: NM_024423.1 
Coding sequence: 64.. 2590 

1 11 21 31 41 51 

l l l I I l 

GGCAGGTCTC GCTCTCGGCA CCCTCCCGGC GCCCGCGTTC TCCTGGCCCT GCCCGGCATC 60 

15 CCGATGGCCG CCGCTGGGCC CCGGCGCTCC GTGCGCGGAG CCGTCTGCCT GCATCTGCTG 120 

CTGACCCTCG TGATCTTCAG TCGTGATGGT GAAGCCTGCA AAAAGGTGAT ACTTAATGTA 180 

CCTTCTAAAC TAGAGGCAGA CAAAATAATT GGCAGAGTTA ATTTGGAAGA GTGCTTCAGG 240 

TCTGCAGACC TCATCCGGTC AAGTGATCCT GATTTCAGAG TTCTAAATGA TGGGT CAGTG 300 

TACACAGCCA GGGCTGTTGC GCTGT CTGAT AAGAAAAGAT CATTTACCAT ATGGCTTTCT 3 60 

20 GACAAAAGGA AACAGACACA GAAAGAGGTT ACTGTGCTGC TAGAACATCA GAAGAAGGTA 42 0 

TCGAAGACAA GACACACTAG AGAAACTGTT CTCAGGCGTG CCAAGAGGAG ATGGGCACCT 480 

ATTCCTTGCT CTATGCAAGA GAATTCCTTG GGCCCTTTCC CATTGTTTCT TCAACAAGTT 540 

GAATCTGATG CAGCACAGAA CTATACTGTC TTCTACTCAA TAAGTGGACG TGGAGTTGAT 600 

AAAGAACCTT TAAATTTGTT TTATATAGAA AGAGACACTG GAAATCTATT TTGCACTCGG 660 

25 CCTGTGGATC GTGAAGAATA TGATGTTTTT GATTTGATTG CTTATGCGTC AACTGCAGAT 720 

GGATATTCAG CAGAT CTGCC CCTCCCACTA CCCATCAGGG TAGAGGATGA AAATGACAAC 780 

CACCCTGTTT TCACAGAAGC AATTTATAAT TTTGAAGTTT TGGAAAGTAG TAGACCTGGT 840 

ACTACAGTGG GGGTGGTTTG TGCCACAGAC AGAGATGAAC CGGACACAAT GCATACGCGC 900 

CTGAAATACA GCATTTTGCA GCAGACACCA AGGTCACCTG GGCTCTTTTC TGTGCATCCC 960 

30 AGCACAGGCG TAAT CACCAC AGTCTCTCAT TATTTGGACA GAGAGGTTGT AGACAAGTAC 1020 

TCATTGATAA TGAAAGTACA AGACATGGAT GGCCAGTTTT TTGGATTGAT AGGCACATCA 10 80 

ACTTGTATCA TAACAGTAAC AG ATT CAAAT GATAATGCAC CCACT TTCAG ACAAAATGCT 1140 

TATGAAGCAT TTGTAGAGGA AAATGCATTC AATGTGGAAA TCTTACGAAT ACCTATAGAA 12 0 0 

GATAAGGATT TAATTAACAC TGCCAATTGG AGAGTCAATT TTACCATTTT AAAGGGAAAT 1260 

35 GAAAATGGAC ATTT CAAAAT C AG CACAGAC AAAGAAACTA ATGAAGGTGT TCTTTCTGTT 13 20 

GTAAAGCCAC TGAATTATGA AGAAAACCGT CAAGTGAACC TGGAAATTGG AGTAAACAAT 13 80 

GAAGCGCCAT TTGCTAGAGA TAT TCCCAGA GTGACAGCCT TGAACAGAGC CTTGGTTACA 1440 

GTTCATGTGA GGGATCTGGA TGAGGGGCCT GAATGCACTC CTGCAGCCCA AT AT GTGCGG 1500 

ATTAAAGAAA ACTTAGCAGT GGGGTCAAAG ATCAACGGCT ATAAGGCATA TGACCCCGAA 1560 

40 AATAGAAATG GCAATGGTTT AAGGTACAAA AAATTGCATG ATCCTAAAGG TTGGATCACC 1620 

ATTGATGAAA TTTCAGGGTC AATCATAACT TCCAAAATCC TGGATAGGGA GGTTGAAACT 1680 

CCCAAAAATG AGTTGTATAA TATTACAGTC CTGGCAATAG ACAAAGATGA TAGATCATGT 1740 

ACTGGAACAC TTGCTGTGAA CATTGAAGAT GTAAATGATA ATCCACCAGA AATACTTCAA 180 0 

GAATATGTAG TCATTTGCAA ACCAAAAATG GGGTATACCG ACATTTTAGC TGTTGATCCT 1860 

45 GATGAACCTG TCCATGGAGC TCCATTTTAT TTCAGTTTGC CCAATACTTC TCCAGAAATC 192 0 

AGTAGACTGT GGAGCCTCAC CAAAGTTAAT GATACAGCTG CCCGTCTTTC AT AT CAG AAA 1980 

AATGCTGGAT TTCAAGAATA TACCATTCCT ATTACTGTAA AAGACAGGGC CGGCCAAGCT 2 040 

G CAA CAAAAT TATTGAGAGT TAATCTGTGT GAATGTACTC ATCCAACTCA GTGTCGTGCG 2100 

ACTTCAAGGA GTACAGGAGT AATACTTGGA AAATGGGCAA TCCTTGCAAT AT T ACTGGGT 2160 

50 ATAGCACTGC TCTTTTCTGT ATTGCTAACT TTAGTATGTG GAGTTTTTGG TGCAACTAAA 2220 

GGGAAACGTT TTCCTGAAGA TTTAGCACAG CAAAACTTAA TTATATCAAA CACAGAAGCA 2280 

CCTGGAGACG ATAGAGTGTG CTCTGCCAAT GGATTTATGA CCCAAACTAC CAACAACTCT 2340 

AGCCAAGGTT TTTGTGGTAC TATGGGATCA GGAATGAAAA ATGGAGGGCA GGAAACCATT 2400 

GAAATGATGA AAGGAGGAAA CCAGACCTTG GAATCCTGCC GGGGGGCTGG GCATCATCAT 2460 

55 ACCCTGGACT CCTGCAGGGG AGGACACACG GAGGTGGACA ACTGCAGATA CACTTACTCG 2520 

GAGTGGCACA GTTTTACTCA ACCCCGTCTC GGTGAAGAAT CCATTAGAGG ACACACTGGT 2580 

TAAAAATTAA ACATAAAAGA AATTGCATCG ATGTAAT CAG AATGAAGACC GCATGCCATC 2640 

CCAAGATTAT GTCCTCACTT ATAACTATGA GGGAAGAGGA TCTCCAGCTG GTTCTGTGGG 2700 

CTGCTGCAGT GAAAAGCAGG AAGAAGATGG CCTTGACTTT TTAAATAATT TGGAACCCAA 2760 

60 ATTTATTACA TTAG CAGAAG CATG C AC AAA GAGATAATGT CACAGTGCTA CAATTAGGTC 2 82 0 

TTTGTCAGAC ATTCTGGAGG TTTCCAAAAA TAATATTGTA AAGTTCAATT TCAACATGTA 2 880 

TGTATATGAT GATTTTTTTC TCAATTTTGA ATTATGCTAC TCACCAATTT ATATTTTTAA 2 940 

AGCCAGTTGT TGCTTATCTT TTCCAAAAAG TGAAAAATGT TAAAACAGAC AACTGGTAAA 3000 

TCTCAAACTC CAGCACTGGA ATTAAGGTCT CTAAAGCATC TGCTCTTTTT TTTTTTTACG 3060 

65 GATATTTTAG TAATAAATAT GCTGGATAAA TATTAGTCCA ACAATAGCTA AGTTATGCTA 3120 

ATATCACATT ATTATGTATT CACTTTAAGT GATAGTTTAA AAAATAAACA AGAAATATTG 3180 

AGTATCACTA TGTGAAGAAA GTTTTGGAAA AGAAACAATG AAGACTGAAT TAAATTAAAA 3240 

ATGTTGCAGC TCATAAAGAA TTGGGACTCA CCCCTACTGC ACTACCAAAT TCATTTGACT 3300 

TTGGAGGCAA AATGTGTTGA AGTGCCCTAT GAAGTAGCAA TTTTCTATAG GAATATAGTT 3 3 60 

70 GGAAATAAAT GTGTGTGTGT ATATTATTAT TAATCAATGC AATATTTAAA AT G AAATG AG 3420 

AACAAAGAGG AAAATGGTAA AAACTTGAAA TGAGGCTGGG GTATAGTTTG TCCTACAATA 3 480 

GAAAAAAGAG AGAGCTTCCT AGGCCTGGGC TCTTAAATGC TGCATTATAA CTGAGTCTAT 3 540 

GAGGAAATAG TTCCTGTCCA ATTTGTGTAA TTTGTTTAAA ATTGTAAATA AATTAAACTT 3600 

TTCTGGTTTC TGTGGGAAGG AAATAGGGAA TCCAATGGAA CAGTAGCTTT GCTTTGCAGT 3660 

75 CTGTTTCAAG ATTTCTGCAT CCACAAGTTA GTAGCAAACT GGGGAATACT CGCTGCAGCT 3720 

GGGGTTCCCT GCTTTTTGGT AGCAAGGGTC CAGAGATGAG GTGTTTTTTT CGGGGAGCTA 3780 

ATAACAAAAA CATTTTAAAA CTTACCTTTA CTGAAGTTAA ATCCTCTATT GCTGTTTCTA 3 840 

TTCTCTCTTA TAGTGACCAA CATCTTTTTA AT T TAG AT C C AAAT AAC CAT GTCCTCCTAG 3 90 0 

AGTTTAGAGG CTAGAGGGAG CTGAGGGGAG GAT CTTACTG AAAGCACCCT GGGGAGATTG 3960 

80 ATTGTCCTTA AACCTAAGCC CCACAAACTT GACACCTGAT CAGGTCTGGG AGCTACAAAA 4020 

TTTCATTTTT CTCCTCACTG CCCTTCTTCT GAGTGGCATT GGCCTGAATC AAGGAAAGCC 4080 

AGGCCTTGTG GGCCCCCTTC TTTCGGCTTT CTGCTAAAGC AACACCTCCA GCAGAGATTC 4140 

CCTTAAGTGA CTCCAGGTTT TCCACCATCC TTCAGCGTGA ATTAATTTTT AATCAGTTTG 42 00 

CTTTCTCCAG AGAAATTTTA AAATAATAGA AGAAATAGAA ATTTTGAATG TATAAAAGAA 42 60 

85 AAAGATCAAG TTGTCATTTT AGAACAGAGG GAACTTTGGG AGAAAGCAGC CCAAGTAGGT 4320 

TATTTGTACA GTCAGAGGGC AACAGGAAGA TGCAGGCCTT CAAGGGCAAG GAGAGGCCAC 4380 

AAGGAATATG GGTGGGAGTA AAAGCAACAT CGTCTGCTTC ATACTTTTTC CTAGGCTTGG 4440 
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CACTGCCTTT TCCTTTCTCA GGCCAATGGC AACTGCCATT TGAGTCCGGT GAGGGATCAG 450 0 

CCAACCTCTT CTCTATGGCT CACCTTATTT GGAGTGAGAA AT CAAGGAGA CAGAGCTGAC 4560 

TGCATGATGA GTCTGAAGGC ATTTGCAGGA TGAGCCTGAA CTGGTTGTGC AGAACAAACA 462 0 

AGGCATTCAT GGGAATTGTT GTATTCCTTC TGCAGCCCTC CTTCTGGGCA CTAAGAAGGT 4680 

CTATGAATTA AATGCCTATC TAAAATTCTG ATTTATTCCT ACATTTTCTG TTTTCTAATT 4740 

TGACCCTAAA AT CTATGTGT TTTAGACTTA GACTTTTTAT TGCCCCCCCC CCCTTTTTTT 4800 

TTGAGACGGA GTCTCGCTCT GACGCACAGG CTGGAGTGCA GTGGCTCCGA TCTCTGCTCA 4860 

CTGAAAGCTC CGCCTCCCGG GTTCATGCCA TTCTCCTGCC TCAGCCTCCT GAGTAGCTGG 492 0 

GACTAGAGGC GCCCACCACC ACGCCCGGCT AATTTTTTGT ATTTTTAATA GAGACGGGGT 4980 

TTCACTGTGT TAGCCAGGAT GGTCTCGATC TCCTGACCTC GTGATCCGCC TGCCTCGGCC 5040 

TCCCAAAGTG CTGGGATTAC AGGCATGACC CACCGCTCCC GGCCTTGTTT TCCGTTTAAA 5100 

GTCGTCTTCT TTTAATGTAA TCATTTTGAA CATGTGTGAA AGTTGAT CAT ACGAATTGGA 5160 

TCAATCTTGA AATACTCAAC CAAAAGACAG TCGAGAAGCC AGGGGGAGAA AGAACTCAGG 522 0 

GCACAAAATA TTGGTCTGAG AATGGAATTC TCTGTAAGCC TAGTTGCTGA AATTTCCTGC 5280 

TGTAACCAGA AGCCAGTTTT ATCTAACGGC TACTGAAACA CCCACTGTGT TTTGCTCACT 5340 

CCCACTCACC GAT CAAAACC TGCTACCTCC CCAAGACTTT ACTAGTGCCG ATAAACTTTC 5400 

TCAAAGAGCA ACCAGTATCA CTTCCCTGTT TATAAAACCT CTAACCATCT CTTTGTTCTT 5460 

TGAACATGCT GAAAACCACC TGGTCTGCAT GTATGCCCGA ATTTGTAATT CTTTTCTCTC 552 0 

AAATGAAAAT TTAATTTTAG GGATTCATTT CTATATTTTC ACATATGTAG TATTATTATT 5580 

TCCTTATATG TGTAAGGTGA AATTTATGGT ATTTGAGTGT GCAAGAAAAT ATATTTTTAA 5640 

AGCTTTCATT TTTCCCCCAG TGAATGATTT AGAATTTTTT ATGTAAATAT ACAGAATGTT 570 0 

TTTTCTTACT TTTATAAGGA AGCAGCTGTC TAAAATGCAG TGGGGTTTGT TTTGCAATGT 5 760 

TTTAAACAGA GTTTTAGTAT TGCTATTAAA AGAAGTTACT TTGCTTTTAA AGAAACTTGG 582 0 

CTGCTTAAAA TAAGCAAAAA TTGGATGCAT AAAGTAATAT TTACAGATGT GGGGAGATGT 5880 

AATAAAACAA TATTAACTTG GCTGCTTAAA ATAAGCAAAA ATTGGATGCA TAAAGTAATA 5 940 

TTTACAGATG TGGGGAGATG TAATAAAACA ATATTAACTT GGTTTCTTGT TTTTGCTGTA 600 0 

TTTAGAGATT - AAATAATTCT AAGATGATCA CTTTGCAAAA TTATGCTTAT GGCTGGCATG 6060 

GAAATAGAAA TACTCAATTA TGTCTTTGTT GTATTAATGG GGAATATTTT GGACAATGTT 612 0 

TCATTAT CAA ATTGTCGACA TCATTAATAT ATATTGTAAT GTTGGGAAGA GATCACTATT 6180 

TTGAAGCACA GCTTTACAGA TGAGTATCTA TGATACATAT GTATAATAAA TTTTGATCGG 6240 

GTATTAAAAG TATTAGAAGG TGGTTATAAT TGCAGAGTAT TCCATGAATA GTACACTGAC 63 00 

ACAGGGGTTT TACTTTGAGG ACCAGTGTAG TCAAGGGAAA ACATGAGTTA AAAAGAAAAG 63 60 

CAGGCAATAT TGCAGTCTTG ATTCTGCCAC TTACAGGATA GATAATGCCT GAACTTTAAT 642 0 

GACAAGATGA T CCAACC ATA AAGGTGCTCT GTGCTTCACA GTGAATCTTT TCCCCATGCA 6480 

GGAGTGTGCT CCCCTACAAA CGTTAAGACT GATCATTTCA AAAAT CTATT AGCTATATCA 6540 

AAAGCCTTAC ATTTTAATAT AGGTTGAACC AAAATTT CAA TTCCAGTAAC TTCTATTGTA 6600 

ACCATTATTT TTGTGTATGT CTTCAAGAAT GTTCATTGGA TTTTTGTTTG TAATAGTAAA 6660 

ATACCGGATA CATTTCACGT GTCCTTCAGT ATTGATTTGG TTGAATATTG GGT CAT AAT G 672 0 

GTTGAGAAGC ATGGACACTA GAGCCAGAAT GCTTGGATAT GAATCCTGGA TCTGTCACTT 6780 

ACTTCTGTGT GACCTTTGAA AGGCTACTTA TTTCCTCTCT TAGCTTTCTC ATT AAAAT CA 6840 

ATGAACAATG CCAGCCTCAT GGGGTTGTTG AATGATTAAA TTAGTTAATA TACCTAAAGT 6900 

ACATAGAACA CTGCCTGCAC ATAGTAAAAG AATTATAAGT GTGAGGTAGT TGGTAAAATT 6 960 

ATGTAGTTGG ATATACTACC GAACAATATC TAATCTCTTT TTAGGGAAAT AAAGTTTGTG 7020 
CATATATATA ATCCCGAAAC ATG 

Seq ID NO: 527 Protein sequence 
Protein Accession #: NP_077741.1 

1 11 21 31 41 51 

I I I 1 I I 

MAAAGPRRSV RGAVCLHLLL TLVIPSRDGE ACKKVILNVP SKLEADKIIG RVNLEECFRS 60 

ADLIRSSDPD FRVLNDGSVY TARAVALSDK KRSFTIWLSD KRKQTQKEVT VLLEHQKKVS 120 

KTRHTRETVL RRAKRRWAP I PCSMQENSLG PFPLFLQQVE SDAAQNYTVF YSISGRGVDK 180 

EPLNLFYIER DTGNLFCTRP VDREEYDVFD LIAYASTADG YSADLPLPLP IRVEDENDNH 240 

PVFTEAIYNF EVLESSRPGT TVGWCATDR DEPDTMHTRL KYSILQQTPR SPGLFSVHPS 3 00 

TGVITTVSHY LDREWDKYS LIMKVQDMDG QFFGLIGTST CIITVTDSND NAPT FRQNAY 3 60 

EAFVEENAFN VEILRIPIED KDLINTANWR VNFTILKGNE NGHFKISTDK ETNEGVLSW 420 

KPLNYEENRQ VNLEIGVNNE APFARDIPRV TALNRALVTV HVRDLDEGPE CTPAAQYVRI 480 

KENLAVGSKI NGYKAYDPEN RNGNGLRYKK LHDPKGWITI DEISGSIITS KILDREVETP 540 

KNELYNITVL AIDKDDRSCT GTLAVNIEDV NDNPPEILQE YWICKPKMG YTDILAVDPD 600 

EPVHGAPFYF SLPNTSPEIS RLWSLTKVND TAARLSYQKN AGFQEYTIPI TVKDRAGQAA 660 

TKLLRVNLCE CTHPTQCRAT SRSTGVILGK WAILAILLGI ALLFSVLLTL VCGVFGATKG 72 0 

KRFPEDLAQQ NLIISNTEAP GDDRVCSANG FMTQTTNNSS QGFCGTMGSG MKNGGQETIE 780 
MMKGGNQTLE SCRGAGHHHT LDSCRGGHTE VDNCRYTYSE WHSFTQPRLG EESIRGHTG 

Seq ID NO: 528 DNA sequence 

Nucleic Acid Accession #: NM_001941.2 

Coding sequence: 64.. 2754 

1 11 21 31 41 51 

I I 1 I I I 

GGCAGGTCTC GCTCTCGGCA CCCTCCCGGC GCCCGCGTTC TCCTGGCCCT GCCCGGCATC 60 

CCGATGGCCG CCGCTGGGCC CCGGCGCTCC GTGCGCGGAG CCGTCTGCCT GCATCTGCTG 120 

CTGACCCTCG TGATCTTCAG TCGTGATGGT GAAGCCTGCA AAAAGGT GAT ACTTAATGTA 180 

CCTTCTAAAC TAGAGGCAGA CAAAATAATT GGCAGAGTTA ATTTGGAAGA GTGCTTCAGG 240 

TCTGCAGACC TCATCCGGTC AAGTGATCCT GATTTCAGAG TTCTAAATGA TGGGTCAGTG 3 00 

TACACAGCCA GGGCTGTTGC GCTGTCTGAT AAGAAAAGAT CATTTACCAT ATGGCTTTCT 360 

GACAAAAGGA AACAGACACA GAAAGAGGTT ACTGTGCTGC T AGAACAT CA GAAGAAGGTA 420 

TCGAAGACAA GACACACTAG AGAAACTGTT CTCAGGCGTG CCAAGAGGAG ATGGGCACCT 480 

ATTCCTTGCT CTATGCAAGA GAATT CCTTG GGCCCTTTCC CATTGTTTCT TCAACAAGTT 540 

GAATCTGATG CAGCACAGAA CTATACTGTC TTCTACTCAA TAAGTGGACG TGGAGTTGAT 600 

AAAGAACCTT TAAATTTGTT TTATATAGAA AGAGACACTG GAAATCTATT TTGCACTCGG 660 

CCTGTGGATC GTGAAGAATA TGATGTTTTT GATTTGATTG CTTATGCGTC AACTGCAGAT 72 0 

GGATATTCAG CAGATCTGCC CCTCCCACTA CCCATCAGGG TAGAGGATGA AAATGACAAC 780 

CACCCTGTTT TCACAGAAGC AATTTATAAT TTTGAAGTTT TGGAAAGTAG TAGACCTGGT 840 

ACTACAGTGG GGGTGGTTTG TGCCACAGAC AGAGATGAAC CGGACACAAT GCATACGCGC 900 

CTGAAATACA GCATTTTGCA GCAGACACCA AGGTCACCTG GGCTCTTTTC TGTGCATCCC 960 
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AGCACAGGCG TAATCACCAC 
TCATTGATAA TGAAAGTACA 
ACTTGTATCA TAACAGTAAC 
TATGAAGCAT TTGTAGAGGA 
5 GATAAGGATT TAATTAACAC 

GAAAATGGAC ATTT CAAAAT 
GTAAAGCCAC TGAATTATGA 
GAAGCGCCAT TTGCTAGAGA 
GTT CATGTGA GGGATCTGGA 
10 ATTAAAGAAA ACTTAGCAGT 

AATAGAAATG GCAATGGTTT 
ATTGATGAAA TTTCAGGGTC 
CCCAAAAATG AGTTGTATAA 
ACTGGAACAC TTGCTGTGAA 
GAATATGTAG TCATTTGCAA 
GATGAACCTG TCCATGGAGC 
AGTAGACTGT GGAGCCTCAC 
AATGCTGGAT TTCAAGAATA 
GCAACAAAAT TATTGAGAGT 
ACTTCAAGGA GTACAGGAGT 
ATAGCACTGC TCTTTTCTGT 
GGGAAACGTT TTCCTGAAGA 
CCTGGAGACG ATAGAGTGTG 
AGCCAAGGTT TTTGTGGTAC 
25 GAAATGATGA AAGGAGGAAA 

ACCCTGGACT CCTGCAGGGG 
GAGTGGCACA GTTTTACTCA 
GAAGACCGCA TGCCATCCCA 
CCAGCTGGTT CTGTGGGCTG 
30 AATAATTTGG AACCCAAATT 

AGTGCTACAA TTAGGTCTTT 
TTCAATTTCA ACATGTATGT 
CCAATTTATA TTTTTAAAGC 
AA.CAGACAAC TGGTAAATCT 
35 TCTTTTTTTT TTTTACGGAT 

ATAGCTAAGT TATGCTAATA 
ATAAACAAGA AATATTGAGT 
ACTGAATTAA ATTAAAAATG 
ACCAAATTCA TTTGACTTTG 
40 TCTATAGGAA TATAGTTGGA 

ATTTAAAATG AAATGAGAAC 
TAGTTTGTCC TACAATAGAA 
ATTATAACTG AGTCTATGAG 
GTAAATAAAT TAAACTTTTC 
45 TAGCTTTGCT TTGCAGTCTG 

GAATACTCGC TGCAGCTGGG 
TTTTTTTCGG GGAGCTAATA 
CTCTATTGCT GTTTCTATTC 
TAACCATGTC CTCCTAGAGT 
50 GCACCCTGGG GAGATTGATT 

GTCTGGGAGC TACAAAATTT 
CTGAATCAAG GAAAGCCAGG 
ACCTCCAGCA GAGATTCCCT 
AATTTTTAAT CAGTTTGCTT 
55 TTGAATGTAT AAAAGAAAAA 

AAGCAGCCCA AGTAGGTTAT 
GGGCAAGGAG AGGCCACAAG 
CTTTTTCCTA GGCTTGGCAC 
GTCCGGTGAG GGATCAGCCA 
60 AAGGAGACAG AGCTGACTGC 
GTTGTGCAGA ACAAACAAGG 
CTGGGCACTA AGAAGGTCTA 
TTTTCTGTTT TCTAATTTGA 
CCCCCCCCCC TTTTTTTTTG 
65 GCTCCGATCT CTGCTCACTG 

GCCTCCTGAG TAGCTGGGAC 
TTTAATAGAG ACGGGGTTTC 
ATCCGCCTGC CTCGGCCTCC 
CTTGTTTTCC GTTTAAAGTC 
70 TG AT CAT ACG AATTGGATCA 

GGGAGAAAGA ACTCAGGGCA 
TTGCTGAAAT TTCCTGCTGT 
ACTGTGTTTT GCTCACTCCC 
CTAGTGCCGA TAAACTTTCT 
TAACCATCTC TTTGTTCTTT 
TTTGTAATTC TTTTCTCTCA 
CATATGTAGT ATTATTATTT 
CAAGAAAATA TATTTTTAAA 
TGTAAATATA CAGAATGTTT 
GGGGTTTGTT TTGCAATGTT 
TGCTTTTAAA GAAACTTGGC 
TACAGATGTG GGGAGATGTA 
TAGAGATTAA ATAATTCTAA 
AATAGAAATA CTCAATTATG 
85 ATTATCAAAT TGTCGACATC 

GAAGCACAGC TTTACAGATG 
ATTAAAAGTA TTAGAAGGTG 
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75 



80 



AGTCTCTCAT 
AGACATGGAT 
AGATTCAAAT 
AAATGCATTC 
TGCCAATTGG 
CAGCACAGAC 
AGAAAACCGT 
TATTCCCAGA 
TGAGGGGCCT 
GGGGT CAAAG 
AAGGTACAAA 
AATCATAACT 
TATTACAGTC 
CATTGAAGAT 
ACCAAAAATG 
TCCATTTTAT 
CAAAGTTAAT 
TACCATTCCT 
TAATCTGTGT 
AATACTTGGA 
ATTGCTAACT 
TTTAGCACAG 
CTCTGCCAAT 
TATGGGATCA 
CCAGACCTTG 
AGGACACACG 
ACCCCGTCTC 
AGATTATGTC 
CTGCAGTGAA 
TATTACATTA 
GTCAGACATT 
ATATGATGAT 
CAGTTGTTGC 
CAAACTCCAG 
ATTTTAGTAA 
TCACATTATT 
ATCACTATGT 
TTGCAGCTCA 
GAGGCAAAAT 
AATAAATGTG 
AAAGAGGAAA 
AAAAGAGAGA 
GAAATAGTTC 
TGGTTTCTGT 
TTTCAAGATT 
GTTCCCTGCT 
ACAAAAACAT 
TCTCTTATAG 
TTAGAGGCTA 
GTCCTTAAAC 
CATTTTTCTC 
CCTTGTGGGC 
TAAGTGACTC 
TCTCCAGAGA 
GAT CAAGTTG 
TTGTACAGTC 
GAATATGGGT 
TGCCTTTTCC 
ACCTCTTCTC 
ATGATGAGTC 
CATT CATGGG 
TGAATTAAAT 
CCCTAAAATC 
AGACGGAGTC 
AAAGCTCCGC 
TACAGGCGCC 
ACTGTGTTAG 
CAAAGTGCTG 
GTCTTCTTTT 
ATCTTGAAAT 
CAAAATATTG 
AACCAGAAGC 
TCACTCACCG 
CAAAG AG C AA 
GAACATGCTG 
AATGAAAATT 
CCTTATATGT 
GCTTTCATTT 
TTTCTTACTT 
TTAAACAGAG 
TGCTTAAAAT 
ATAAAACAAT 
GATGATCACT 
TCTTTGTTGT 
ATTAATATAT 
AGTATCTATG 
GTTATAATTG 



TATTTGGACA 
GGCCAGTTTT 
GATAATGCAC 
AATGTGGAAA 
AGAGTCAATT 
AAAGAAACTA 
CAAGTGAACC 
GTGACAGCCT 
GAATGCACTC 
ATCAACGGCT 
AAATTGCATG 
TCCAAAATCC 
CTGGCAATAG 
GTAAATGATA 
GGGTATACCG 
TTCAGTTTGC 
GATACAGCTG 
ATTACTGTAA 
GAATGTACTC 
AAATGGGCAA 
TTAGTATGTG 
CAAAACTTAA 
GGATTTATGA 
GGAATGAAAA 
GAATCCTGCC 
GAGGTGGACA 
GGTGAAAAAT 
CTCACTTATA 
AAGCAGGAAG 
GCAGAAGCAT 
CTGGAGGTTT 
TTTTTTCTCA 
TTATCTTTTC 
CACTGGAATT 
TAAATATGCT 
ATGTATTCAC 
GAAGAAAGTT 
TAAAGAATTG 
GTGTTGAAGT 
TGTGTGTATA 
ATGGTAAAAA 
GCTTCCTAGG 
CTGTCCAATT 
GGGAAGGAAA 
TCTGCATCCA 
TTTTGGTAGC 
TTTAAAACTT 
TGACCAACAT 
GAGGGAGCTG 
CTAAGCCCCA 
CTCACTGCCC 
CCCCTTCTTT 
CAGGTTTTCC 
AATTTTAAAA 
TCATTTTAGA 
AGAGGGCAAC 
GGGAGTAAAA 
TTTCTCAGGC 
TATGGCTCAC 
TGAAGGCATT 
AATTGTTGTA 
GCCTATCTAA 
TATGTGTTTT 
TCGCTCTGAC 
CTCCCGGGTT 
CACCACCACG 
CCAGGATGGT 
GGATTACAGG 
AATGTAATCA 
ACTCAACCAA 
GTCTGAGAAT 
CAGTTTTATC 
ATCAAAACCT 
CCAGTATCAC 
AAAACCACCT 
TAATTTTAGG 
GTAAGGTGAA 
TTCCCCCAGT 
TTATAAGGAA 
TTTTAGTATT 
AAGCAAAAAT 
ATTAACTTGG 
TTGCAAAATT 
ATTAATGGGG 
ATTGTAATGT 
ATACATATGT 
CAGAGTATTC 



GAGAGGTTGT 
TTGGATTGAT 
CCACTTTCAG 
TCTTACGAAT 
TTACCATTTT 
ATGAAGGTGT 
TGGAAATTGG 
TGAACAGAGC 
CTGCAGCCCA 
ATAAGGCATA 
ATCCTAAAGG 
TGGATAGGGA 
ACAAAGATGA 
ATCCACCAGA 
ACATTTTAGC 
CCAATACTTC 
CCCGTCTTTC 
AAGACAGGGC 
ATCCAACTCA 
TCCTTGCAAT 
GAGTTTTTGG 
TT ATAT C AAA 
CCCAAACTAC 
ATGGAGGGCA 
GGGGGGCTGG 
ACTGCAGATA 
TGCATCGATG 
ACTATGAGGG 
AAGATGGCCT 
GCACAAAGAG 
CCAAAAATAA 
ATTTTGAATT 
CAAAAAGTGA 
AAGGTCTCTA 
GGATAAATAT 
TTTAAGTGAT 
TTGGAAAAGA 
GGACTCACCC 
GCCCTATGAA 
TTATTATTAA 
CTTGAAATGA 
CCTGGGCTCT 
TGTGTAATTT 
TAGGGAATCC 
CAAGTTAGTA 
AAGGGTCCAG 
ACCTTTACTG 
CTTTTTAATT 
AGGGGAGGAT 
CAAACTTGAC 
TTCTTCTGAG 
CGGCTTTCTG 
ACCATCCTTC 
TAATAGAAGA 
ACAGAGGGAA 
AGGAAGATGC 
GCAACATCGT 
CAATGGCAAC 
CTTATTTGGA 
TGCAGGATGA 
TTCCTTCTGC 
AATTCTGATT 
AGACTTAGAC 
GCACAGGCTG 
CATGCCATTC 
CCCGGCTAAT 
CTCGATCTCC 
CATGACCCAC 
TTTTGAACAT 
AAGACAGTCG 
GGAATTCTCT 
TAACGGCTAC 
GCTACCTCCC 
TTCCCTGTTT 
GGTCTGCATG 
GATTCATTTC 
ATTTATGGTA 
GAATGATTTA 
GCAGCTGTCT 
GCTATTAAAA 
TGGATGCATA 
TTTCTTGTTT 
ATGCTTATGG 
AATATTTTGG 
TGGGAAGAGA 
ATAATAAATT 
CATGAATAGT 



AGACAAGTAC 1020 

AGGCACATCA 10 80 

ACAAAATGCT 1140 

ACCTATAGAA 12 00 

AAAGGGAAAT 1260 

TCTTTCTGTT 1320 

AGTAAACAAT 13 80 

CTTGGTTACA 1440 

ATATGTGCGG 1500 

TGACCCCGAA 1560 

TTGGAT CACC 1620 

GGTTGAAACT 1680 

TAGATCATGT 1740 

AATACTTCAA 1800 

TGTTGATCCT 1860 

TCCAGAAATC 192 0 

ATATCAGAAA 1980 

CGGCCAAGCT 2040 

GTGTCGTGCG 2100 

ATTACTGGGT 2160 

TGCAACTAAA 222 0 

CACAGAAGCA 22 80 

CAACAACTCT 2 340 

GGAAACCATT 240 0 

GCATCATCAT 2460 

CACTTACTCG 2520 

TAATCAGAAT 25 80 

AAGAGGATCT 2 640 

TGACTTTTTA 2 700 

ATAATGTCAC 2760 

TATTGTAAAG 2 82 0 

ATGCTACTCA 2 880 

AAAATGTTAA 2 940 

AAGCATCTGC 3 00 0 

TAGTCCAACA 30 60 

AGTTTAAAAA 3120 

AACAATGAAG 3180 

CTACTGCACT 3240 

GTAGCAATTT 3 3 00 

TCAATGCAAT 33 60 

GGCTGGGGTA 342 0 

TAAATGCTGC 3480 

GTTTAAAATT 3 540 

AATGGAACAG 3 60 0 

GCAAACTGGG 3 660 

AGATGAGGTG 3 720 

AAGTTAAATC 3 780 

TAGATCCAAA 3 840 

CTTACTGAAA 3 900 

ACCTGAT CAG 3 960 

TGGCATTGGC 4020 

CTAAAGCAAC 4080 

AGCGTGAATT 4140 

AATAGAAATT 42 00 

CTTTGGGAGA 42 60 

AGGCCTTCAA 4320 

CTGCTTCATA 43 80 

TGCCATTTGA 4440 

GTGAGAAATC 4500 

GCCTGAACTG 4560 

AGCCCTCCTT 462 0 

TATTCCTACA 4680 

TTTTTATTGC 4740 

GAGTGCAGTG 480 0 

TCCTGCCTCA 4860 

TTTTTGTATT 4 920 

TGACCTCGTG 4980 

CGCTCCCGGC 5040 

GTGTGAAAGT 5100 

AGAAGCCAGG 5160 

GTAAGCCTAG 522 0 

TGAAACACCC 52 80 

CAAGACTTTA 5340 

ATAAAACCTC 5400 

TATGCCCGAA 5460 

TATATTTTCA 5520 

TTTGAGTGTG 5580 

GAATTTTTTA 5640 

AAAATGCAGT 5700 

GAAGTTACTT 5760 

AAGTAATATT 582 0 

TTGCTGTATT 5880 

CTGGCATGGA 5940 

ACAATGTTTC 6000 

TCACTATTTT 60 60 

TTGATCGGGT 6120 

ACACTGACAC 6180 
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AGGGGTTTTA CTTTGAGGAC CAGTGTAGTC AAGGGAAAAC ATGAGTTAAA AAGAAAAGCA 6240 

GGCAATATTG CAGTCTTGAT TCTGCCACTT ACAGGATAGA TAATGCCTGA ACTTTAATGA 63 00 

CAAGATGATC CAACCATAAA GGTGCTCTGT GCTTCACAGT GAATCTTTTC CCCATGCAGG 63 60 

AGTGTGCTCC CCTACAAACG TTAAGACTGA TCATTTCAAA AATCTATTAG CTATATCAAA 642 0 

5 AGCCTTACAT TTTAATATAG GTTGAACCAA AATTTCAATT CCAGTAACTT CTATTGTAAC 64 80 

CATTATTTTT GTGTATGTCT TCAAGAATGT TCATTGGATT TTTGTTTGTA ATAGTAAAAT 6540 

AC CGG AT AC A TTTCACGTGT CCTTCAGTAT TGATTTGGTT GAATATTGGG TCATAATGGT 660 0 

TG AGAAG CAT GGACACTAGA GCCAGAATGC TTGGATATGA ATCCTGGATC TGT CACTTAC 6660 

TTCTGTGTGA CCTTTGAAAG GCTACTTATT TCCTCTCTTA GCTTTCTCAT TAAAATCAAT 6720 

10 GAACAATGCC AGCCTCATGG GGTTGTTGAA TGATTAAATT AGTTAATATA CCTAAAGTAC 6780 

ATAGAACACT GCCTGCACAT AGTAAAAGAA TTATAAGTGT GAGGTAGTTG GTAAAATTAT 6840 

GTAGTTGGAT ATACTACCGA ACAATATCTA ATCTCTTTTT AGGGAAATAA AGTTTGTGCA 690 0 
TATATATAAT CCCGAAACAT G 

15 Seq ID NO: 529 Protein sequence 
Protein Accession #: NP_001932.1 



1 11 21 31 41 51 

on I I I I 1 I 

2(J MAAAGPRRSV RGAVCLHLLL TLVIFSRDGE ACKKVILNVP SKLEADKIIG RVNLEECFRS 60 

ADLIRSSDPD FRVLNDGSVY TARAVALSDK KRSFTIWLSD KRKQTQKEVT VLLEHQKKVS 12 0 

KTRHTRETVL RRAKRRW AP I PCSMQENSLG PFPLFLQQVE SDAAQNYTVF YS I SGRGVDK 180 

EPLNLFYIER DTGNLFCTRP VDREEYDVFD LIAYASTADG YSADLPLPLP I RVED ENDNH 240 

PVFTEAIYNF EVLESSRPGT TVGWCATDR DEPDTMHTRL KYSILQQTPR SPGLFSVHPS 300 

25 TGVITTVSHY LDREWDKYS LIMKVQDMDG QFFGLIGTST CIITVTDSND NAPTFRQNAY 360 

EAFVEENAFN VEILRIPIED KDLINTANWR VNFTILKGNE NGHFKI STDK ETNEGVLSW 42 0 

KPLNYEENRQ VNLEIGVNNE APFARD I PRV TALNRALVTV HVRDLDEGPE CTPAAQYVRI 480 

KENLAVGSKI NGYKA YD PEN RNGNGLRYKK LHDPKGWITI DEISGSIITS KILDREVETP 540 

KNELYNITVL AIDKDDRSCT GTLAVNIEDV NDNPPEILQE YWICKPKMG YTDILAVDPD 60 0 

30 EPVHGAPFYF SLPNTSPEIS RLWSLTKVND TAARLSYQKN AGFQEYTIPI TVKDRAGQAA 660 

TKLLRVNLCE CTHPTQCRAT SRSTGVILGK WAILAILLGI ALLFSVLLTL VCGVFGATKG 72 0 

KRFPEDLAQQ NDIISNTEAP GDDRVCSANG FMTQTTNNSS QGFCGTMGSG MKNGGQETIE 780 

MMKGGNQTLE SCRGAGHHHT LDSCRGGHTE VDNCRYTYSE WHSFTQPRLG EKLHRCNQNE 840 
DRMPSQDYVL TYNYEGRGSP AGSVGCCSEK QEEDGLDFLN NLEPKFITLA EACTKR 



40 



Seq ID NO: 530 DNA sequence 

Nucleic Acid Accession #: NM_016583.2 

Coding sequence: 72..842 



1 11 21 31 41 51 

I I I 1 1 I 

GGAGTGGGGG AGAGAGAGGA GACCAGGACA GCTGCTGAGA CCTCTAAGAA GTCCAGATAC 60 

TAAGAGCAAA GATGTTTCAA ACTGGGGGCC TCATTGTCTT CTACGGGCTG TTAGCCCAGA 120 

45 CCATGGCCCA GTTTGGAGGC CTGCCCGTGC CCCTGGACCA GACCCTGCCC TTGAATGTGA 18 0 

ATCCAGCCCT GCCCTTGAGT CCCACAGGTC TTGCAGGAAG CTTGACAAAT GCCCTCAGCA 240 

ATGGCCTGCT GTCTGGGGGC CTGTTGGGCA TTCTGGAAAA CCTTCCGCTC CTGGACATCC 300 

TGAAGCCTGG AGGAGGTACT TCTGGTGGCC TCCTTGGGGG ACTGCTTGGA AAAGTGACGT 360 

CAGTGATTCC TGGCCTGAAC AACATCATTG ACATAAAGGT CACTGACCCC CAGCTGCTGG 420 

50 AACTTGGCCT TGTGCAGAGC CCTGATGGCC ACCGTCTCTA TGTCACCAT C CCTCTCGGCA 480 

TAAAGCTCCA AGTGAATACG CCCCTGGTCG GTGCAAGTCT GTTGAGGCTG GCTGTGAAGC 540 

TGGACATCAC TGCAGAAATC TTAGCTGTGA GAGATAAGCA GGAGAGGATC CACCTGGTCC 600 

TTGGTGACTG CACCCATTCC CCTGGAAGCC TGCAAATTTC TCTGCTTGAT GGACTTGGCC 660 

CCCTCCCCAT TCAAGGTCTT CTGGACAGCC TCACAGGGAT CTTGAATAAA GTCCTGCCTG 720 

55 AGTTGGTTCA GGGCAACGTG TGCCCTCTGG TCAATGAGGT TCTCAGAGGC TTGGACATCA 780 

CCCTGGTGCA TGACATTGTT AACATGCTGA TCCACGGACT ACAGTTTGTC ATCAAGGTCT 840 

AAGCCTTCCA GGAAGGGGCT GGCCTCTGCT GAGCTGCTTC CCAGTGCTCA CAGATGGCTG 900 

GCCCATGTGC TGGAAGATGA CACAGTTGCC TTCTCTCCGA GGAACCTGCC CCCTCTCCTT 960 

TCCCACCAGG CGTGTGTAAC ATCCCATGTG CCTCACCTAA TAAAATGGCT CTTCTTCTGC 1020 

60 AAAAAAAAAA AAAAAAAAAA AAAAAAAAA 



Seq ID NO: 531 Protein sequence 
Protein Accession #: NP_057667.1 

65 1 11 21 31 41 51 

l l I l l I 

MFQTGGLIVF YGLLAQTMAQ FGGLPVPLDQ TLPLNVNPAIi PLSPTGLAGS LTNALSNGLL 60 

SGGLLGILEN LPL>LDIL>KPG GGTSGGLLGG LLGKVTSVIP GLNNIIDIKV TDPQLLELGL 120 

VQSPDGHRLY VTIPLGIKLQ VNTPLVGASL LRLAVKLDIT AEILAVRDKQ ERIHLVLGDC 180 

70 THSPGSLQIS LLDGLGPLPI QGDLDSLTGI LNKVLPELVQ GNVCPLVNEV LRGLDITLVH 24 0 

DIVNMLtlHGL QFVIKV 



Seq ID NO: 532 DNA sequence 
75 Nucleic Acid Accession #: NM_004363.1 
Coding sequence: 115..2223 

1 11 21 31 41 51 

on I 1 1 1 1 1 

OU CTCAGGGCAG AGGGAGGAAG GACAG CAGAC CAGACAGTCA CAGCAGCCTT GACAAAACGT 60 

TCCTGGAACT CAAGCTCTTC TCCACAGAGG AGGACAGAGC AGACAGCAGA GACCATGGAG 12 0 
TCTCCCTCGG CCCCTCCCCA CAGATGGTGC ATCCCCTGGC AGAGGCTCCT GCTCACAGCC 180 
TCACTTCTAA CCTTCTGGAA CCCGCCCACC ACTGCCAAGC TCACTATTGA ATCCACGCCG 240 
TTCAATGTCG CAGAGGGGAA GGAGGTGCTT CTACTTGTCC ACAATCTGCC CCAGCATCTT 300 

85 TTTGGCTACA GCTGGTACAA AGGTGAAAGA GTGGATGGCA ACCGTCAAAT TATAGGATAT 360 

GTAATAGGAA CTCAACAAGC TACCCCAGGG CCCGCATACA GTGGTCGAGA GATAATATAC 420 
CCCAATGCAT CCCTGCTGAT CCAGAACATC ATCCAGAATG ACACAGGATT CTACACCCTA 480 
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CACGTCATAA AGTCAGATCT 
GAGCTGCCCA AGCCCTCCAT 
GTGGCCTTCA CCTGTGAACC 
CAGAGCCTCC CGGTCAGTCC 
TTCAATGTCA CAAGAAATGA 
GCCAGGCGCA GTGATTCAGT 
TCCCCTCTAA ACACATCTTA 
TCTAACCCAC CTGCACAGTA 
GAGCTCTTTA TCCCCAACAT 
AACTCAGACA CTGGCCTCAA 
CCCAAACCCT TCATCACCAG 
TTAACCTGTG AACCTGAGAT 
CTCGCGGTCA GTCCCAGGCT 
GTCACAAGGA ATGATGTAGG 
CACAGCGACC CAGT CATCCT 
TCATACACCT ATTACCGTCC 
CCACCTGCAC AGTATTCTTG 
TTTATCTCCA ACATCACTGA 
GCCAGTGGCC ACAGCAGGAC 
CCCTCCATCT CCAGCAACAA 
TGTGAACCTG AGGCTCAGAA 
GTCAGTCCCA GGCTGCAGCT 
AGAAATGACG CAAGAGCCTA 
GACC CAGTCA CCCTGGATGT 
TCGTCTTACC TTTCGGGAGC 
CCGCAGTATT CTTGGCGTAT 
GCCAAAATCA CGCCAAATAA 
GGCCGCAATA ATTCCATAGT 
CTCTCAGCTG GGGCCACTGT 
TAGCAGCCCT GGTGTAGTTT 
TAAAGCATTT GCAACAGCTA 
AG AC T C T G AC CAGAG AT CGA 
AAATACAAAA ATGAGCTGGG 
TGAGGCAGGA GAATCGCTTG 
ACTGCACTCC AGTCTGGCAA 
TCTGACCTGT ACTCTTGAAT 
AACTTTAATG AACTAACTGA 
TAATTAATTT CATGGGACTA 
TTCCCAGATT TCAGGAAACT 
AAATATACTT TTGTGAACAA 
AGACTTGGGA AACTATTCAT 
TCAATAAAAA TCTGCTCTTT 
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TGTGAATGAA 
CTCCAGCAAC 
TGAGACTCAG 
CAGGCTGCAG 
CACAGCAAGC 
CATCCTGAAT 
CAGATCAGGG 
CTCTTGGTTT 
CACTGTGAAT 
TAGGACCACA 
CAACAACTCC 
TCAGAACACA 
GCAGCTGTCC 
ACCCTATGAG 
GAATGTCCTC 
AGGGGTGAAC 
GCTGATTGAT 
GAAGAACAGC 
TACAGTCAAG 
CTCCAAACCC 
CACAACCTAC 
GTCCAATGGC 
TGTATGTGGA 
CCTCTATGGG 
GAACCTCAAC 
CAATGGGATA 
TAACGGGACC 
CAAGAGCATC 
CGGCAT CATG 
CTTCATTTCA 
CAGT CTAAAA 
GACCATCCTA 
CTTGGTGGCG 
AACCCGGGAG 
CAGAGCAAGA 
ACAAGTTTCT 
CAGCTTCATG 
AATGAACTAA 
TTTTTTCTTT 
AAATTGAGAC 
GAATATTTAT 
GTATAACAGA 



GAAGCAACTG 
AACTCCAAAC 
GACGCAACCT 
CTGTCCAATG 
TACAAATGTG 
GTCCTCTATG 
GAAAATCTGA 
GTCAATGGGA 
AATAGTGGAT 
GTCACGACGA 
AACCCCGTGG 
ACCTACCTGT 
AATGACAACA 
TGTGGAATCC 
TATGGCCCAG 
CTCAGCCTCT 
GGGAACATCC 
GGACTCTATA 
ACAATCACAG 
GTGGAGGACA 
CTGTGGTGGG 
AACAGGACCC 
ATCCAGAACT 
CCGGACACCC 
CTCTCCTGCC 
CCGCAGCAAC 
TATGCCTGTT 
ACAGTCTCTG 
ATTGGAGTGC 
GGAAGACTGA 
TTGCTTCTTT 
GCCAACATCG 
CGCACCTGTA 
GTGGAGATTG 
CTCCATCTCA 
GATACCACTG 
AAACTGTCCA 
TGAGGATTGC 
TAAGCTATCC 
ATTTACATTT 
ATTGTATGGT 
AAAA 



GCCAGTTCCG 
CCGTGGAGGA 
ACCTGTGGTG 
GCAACAGGAC 
AAACCCAGAA 
GCCCGGATGC 
ACCTCTCCTG 
CTTTCCAGCA 
CCTATACGTG 
TCACAGTCTA 
AGGATGAGGA 
GGTGGGTAAA 
GGACCCTCAC 
AGAACGAATT 
ACGACCCCAC 
CCTGCCATGC 
AGCAACACAC 
CCTGCCAGGC 
TCTCTGCGGA 
AGGATGCTGT 
TAAATGGTCA 
TCACTCTATT 
CAGTGAGTGC 
CCATCATTTC 
ACTCGGCCTC 
ACACACAAGT 
TTGTCTCTAA 
CATCTGGAAC 
TGGTTGGGGT 
CAGTTGTTTT 
ACCAAGGATA 
TGAAACCCCA 
GTCCCAGTTA 
CAGTGAGCCC 
AAAAGAAAAG 
CACTGTCTGA 
CCAAGATCAA 
TGATTCTTTA 
ACTCTTACAG 
TCTCCCTATG 
AATATAGTTA 



GGTATACCCG 540 

CAAGGATGCT 600 

GGTAAACAAT 660 

CCTCACTCTA 720 

CCCAGTGAGT 780 

CCCCACCATT 840 

CCACGCAGCC 900 

ATCCACCCAA 960 

CCAAGCCCAT 102 0 

TGCAGAGCCA 10 80 

TGCTGTAGCC 1140 

TAATCAGAGC 12 00 

T CTACT CAGT 12 60 

AAGTGTTGAC 1320 

CATTTCCCCC 13 80 

AGCCTCTAAC 1440 

ACAAGAGCTC 150 0 

CAATAACTCA 1560 

GCTGCCCAAG 1620 

GGCCTTCACC 1680 

GAGCCTCCCA 1740 

CAATGTCACA 1800 

AAACCGCAGT 1860 

CCCCCCAGAC 192 0 

TAACCCATCC 1980 

TCTCTTTATC 2040 

CTTGGCTACT 2100 

TTCTCCTGGT 2160 

TGCTCTGATA 2220 

GCTTCTTCCT 2280 

TTTACAGAAA 2340 

TCTCTACTAA 240 0 

CTCGGGAGGC 2460 

AGATCGCACC 252 0 

AAAAGAAGAC 2 580 

GAATTTCCAA 2 640 

G CAGAG AAAA 2700 

AATGTCTTGT 2760 

CAATTTGATA 2820 

TGGTCGCTCC 2 880 

TTGCACAAGT 2 940 



Seq ID NO: 533 Protein sequence 
45 Protein Accession #: NP_004354.1 



50 



55 



60 



MESPSAPPHR 
HLFGYSWYKG 
TLHVI KSDLV 
NNQSLPVSPR 
TISPLNTSYR 
AHNSDTGLNR 
QSLPVSPRLQ 
SPSYTYYRPG 
NSASGHSRTT 
LPVSPRLQLS 
PDSSYLSGAN 
ATGRNNS I VK 



11 
I 

WCIPWQRLLL 
ERVDGNRQII 
NEEATGQFRV 
LQLSNGNRTL 
SGENLNLSCH 
TTVTT I TVYA 
LSNDNRTLTL 
VNLSLSCHAA 
VKTITVSAEL 
NGNRTLTL FN 
LNLSCHSASN 
SITVSASGTS 



21 
I 

TASLLTFWNP 
GYVIGTQQAT 
YPELPKPSIS 
TLFNVTRNDT 
AASNPPAQYS 
EPPKPFITSN 
LSVTRNDVGP 
SNPPAQYSWL 
PKPSISSNNS 
VTRNDARAYV 
PSPQYSWRIN 
PGLSAGATVG 



31 

PTTAKLTIES 
PGPAYSGREI 
SNNSKPVEDK 
ASYKCETQNP 
WFVNGTFQQS 
NSNPVEDEDA 
YECGIQNELS 
IDGNIQQHTQ 
KPVEDKDAVA 
CGIQNSVSAN 
GIPQQHTQVL 
IMIGVLVGVA 



41 

1 

TPFNVAEGKE 
IYPNASLLIQ 
DAVAFTCEPE 
VSARRSDSVI 
TQELFIPNIT 
VALTCEPEIQ 
VDHSDPVILN 
ELFISNITEK 
FTCEPEAQNT 
RSDPVTLDVL 
FIAKITPNNN 
LI 



I 1 

VLLLVHNLPQ 60 

NIIQNDTGFY 12 0 

TQDATYLWWV 180 

LNVLYGPDAP 240 

VNNSGSYTCQ 3 00 

NTTYLWWVNN 3 60 

VLYGPDDPTI 42 0 

NSGLYTCQAN 480 

TYLWWVNGQS 540 

YGPDTPIISP 600 

GTYACFVSNL 660 



65 



70 



75 



Seq ID NO: 534 DNA sequence 

Nucleic Acid Accession #: NM_006952.1 

Coding sequence: 11..793 



80 



AAT CCCGACA 
TGGAAATGTG 
ATCTGACCAA 
GGCTGCCTGG 
TGTAGGCATC 
AGTATATGCC 
ACCCAACCTC 
TGATGACCAG 
CAATTGCTGT 
TGAGAATAAT 
AGAACCTCTC 
CTGCTATGAA 
ATTTGCCATT 
AATTGAATAT 



11 
I 

ATGGCGAAAG 
ATTATTGGTT 
CACAGCCTCT 
ATCGGCATAT 
ATGAAGTCCA 
TTTGAAGTGG 
TTCCTGAAGC 
TGGAAAAACA 
GGCGTAAATG 
GATGCTGACT 
AACCTGGAGG 
CTGATCTCTG 
CTCTGCTGGA 
TAAGAA 



21 
I 

ACAACTCAAC 
GTTGCGGCAT 
ACCCACTGCT 
TTGTGGGCAT 
GCAGGAAAAT 
CATCTTGTAT 
AGATGCTAGA 
ATGGAGTCAC 
GTCCATCAGA 
ATCCCTGGCC 
CTTGTAAACT 
GTCCAATGAA 
CTTTTTGGGT 



31 
I 

TGTTCGTTGC 
TGCCCTGACT 
TGAAGCCACC 
CTGCCTCTTC 
TCTTCTGGCG 
CACAGCAGCA 
GAGGTACCAA 
CAAAACCTGG 
CTGGCAAAAA 
TCGTCAATGC 
AGGCGTGCCT 
CCGACACGCC 
TCTCCTGGGT 



41 
I 

TTCCAGGGCC 
GCGGAGTGCA 
GACAACGATG 
TGCCTGTCTG 
TATTTCATTC 
ACACAACGAG 
AACAACAG C C 
GACAGGCTCA 
TACACATCTG 
TGTGTTATGA 
GGTTTTTATC 
TGGGGGGTTG 
ACCATGTTCT 



51 
I 

TGCTGATTTT 60 

TCTTCTTTGT 12 0 

ACATCTATGG 180 

TTCTAGGCAT 240 

TGATGTTTAT 300 

ACTTTTTCAC 3 60 

CTCCAAACAA 42 0 

TGCTCCAGGA 480 

CCTTCCGGAC 540 

ACAATCTTAA 600 

ACAAT CAGGG 660 

CCTGGTTTGG 72 0 

ACTGGAGCAG 7 80 



85 



Seq ID NO: 535 Protein sequence 
Protein Accession #: NP_008883.1 



11 



21 



31 
1 



41 



51 



390 



WO 02/086443 

MAKDNSTVRC FQGLLIFGNV IIGCCGIALT AECIFFVSDQ HSLYPLLEAT DNDD I YGAAW 60 

IGIFVGICLF CLSVLGIVGI MKSSRKILLA YFILMFIVYA FEVASCITAA TQRDFFTPNL 12 0 

FLKQMLERYQ NNSPPNNDDQ WKNNGVTKTW DRLMLQDNCC GVNGPSDWQK YTSAFRTENN 180 

DADYPWPRQC CVMNNLKEPL NLEACKLGVP GFYHNQGCYE LISGPMNRHA WGVAWFGFAI 240 
LCWTFWVLLG TMFYWSRIEY 



PCT/US02/12476 



10 



15 



20 



25 



30 



Seq ID NO: 536 DNA sequence 

Nucleic Acid Accession #: NM_002638.1 

Coding sequence: 120..473 



11 



CAATACAGCT 
GCTGGACTGC 
TGAGGGCCAG 
AGGCAGCTGT 
T CAATGGAC A 
CGCAAGAGCC 
TCCGGTGCGC 
TCAAGAAGTG 
CGGTCCTTGC 
TGCTGCCCTT 
GAGCTGCCTC 



AAGGAATTAT 
ATAAAGATTG 
CAGCTTCTTG 
CACGGGAGTT 
AGATCCCGTT 
AGT CAAAGGT 
CATGTTGAAT 
CTGTGAAGGC 
TGCACCTGTG 
CCCCTTCCCA 
TCTCATCCAC 



21 
I 

CCCTTGTAAA 
GTATGGCCTT 
ATCGTGGTGG 
CCTGTTAAAG 
AAAGGACAAG 
CCAGTCTCCA 
CCCCCTAACC 
TCTTGCGGGA 
CCGTCCCCAG 
CACTGT CCAT 
TTTCCAATAA 



31 

I 

TACCACAGAC 
AGCTCTTAGC 
TGTTCCTCAT 
GTCAAGACAC 
TTTCAGTTAA 
CTAAGCCTGG 
GCTGCTTGAA 
TGGCCTGTTT 
AGCTACAGGC 
TCTTCCTCCC 
A 



41 
I 

CCGCCCTGGA 
CAAACACCTT 
CGCTGGGACG 
TGTCAAAGGC 
AGGT CAAG AT 
CTCCTGCCCC 
AGATACTGAC 
CGTTCCCCAG 
CCCATCTGGT 
ATT CAGG ATG 



51 



GCCAGGCCAA 
CCTGACACCA 
CTGGTTCTAG 
CGTGTTCCAT 
AAAGTCAAAG 
ATTATCTTGA 
TGCCCAGGAA 
TGAAGGGAGC 
CCTAAGTCCC 
CCCACGGCTG 



Seq ID NO: 537 Protein sequence 
Protein Accession #: NP_002629.1 

1 11 21 31 41 51 

I I 1 I -I I 

MRASSFLIW VFLIAGTIiVL EAAVTGVPVK GQDTVKGRVP FNGQDPVKGQ VSVKGQDKVK 

AQEPVKGPVS TKPGSCPIIL IRCAMLNPPN RCLKDTDCPG IKKCCEGSCG MACFVPQ 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 



60 



35 



Seq ID NO: 538 DNA sequence 

Nucleic Acid Accession #: NM_001793.2 

Coding sequence: 71..2560 



40 



45 



50 



55 



60 



65 



70 



75- 



80 



85 



AAAGGGGCAA 
CTCTGCAGCC 
CTGGCTGCAG 
CTTGGAGGCG 
CTGCCCTGGG 
TGGCGAGACA 
ATCCAAACGT 
TGAAAATGGC 
AGACACCAAG 
CTTCGCTGTA 
GATTGCCAAG 
CCCCATGAAC 
GGACACCTTC 
GACAGCCACG 
CCATAGCCAA 
CACCATCAGC 
CATCCAGGCC 
GATCCTTGAT 
GCCTGAGAAT 
CAACTCACCA 
TACCATCACC 
TTTTGAGGCC 
GCTGAAGCTC 
ACCTGTGTTT 
GCCTGTGTGT 
CATCCTGAGA 
TGTGGGCACC 
GGTCTTGGCC 
ACTGATTGAT 
CCAAAGCCCT 
CCCTTTCCAG 
GGAAGGTGAC 
GCACCTTTCT 
GTGCGACTGC 
CCCTGTGCTG 
GAGAAAGAAG 
CGTCTTCTAC 
GCTCCACCGA 
CATCATCCCG 
TATAATTGAG 
CTTGGTGTTC 
CTCCGCCTCC 
GAAGCTGGCA 
GGGACCAAAC 
GACTTCGGAG 
ACGTTAGAGT 
AGCACTGAAA 
TCTTACCTGC 
TACAGTGGAC 



11 
I 

GAGCTGAGCG 
ATGGGGCTCC 
TGCGCGGCCT 
GGAGGCGCGG 
CAAGAGCCAG 
GTC CAGG AAA 
ATCTTACGAA 
AAGGGTCCCT 
ATTTTCTACA 
GAGAAGGAGA 
TATGAGCTCT 
ATCTCCATCA 
CGAGGGAGTG 
GATGAGGATG 
GAACCAAAGG 
GTCATCTCCA 
ACAGACATGG 
GCCAATGACA 
GCAGTGGGCC 
GCGTGGCGTG 
ACCCACCCTG 
AAAAACC AG C 
CCAACCTCCA 
GTCCCACCCT 
GTCTACACTG 
GACCCAGCAG 
CTCGACCGTG 
ATGGACAATG 
GTCAATGACC 
GTGCGCCAGG 
GCCCAGCTCA 
ACAGTGGTCT 
CTGTCTGACC 
CATGGCCATG 
GGGGCTGTCC 
CGGAAGATCA 
TATGGCGAAG 
GGTCTGGAGG 
ACACCCATGT 
AACCTGAAGG 
GACTATGAGG 
GACCAAGACC 
GACATGTACG 
GTCAGGCCAC 
CTTGTCAGGA 
GGTTGCTTCC 
ACCTCTCCAC 
CGTAAAATGC 
TTTCTCTCTG 



21 
I 

GAACACCGGC 
CTCGTGGACC 
CCGAGCCGTG 
AGCAGGAGCC 
CTCTGTTTAG 
GAAGGT CACT 
GACACAAGAG 
TCCCCCAGAG 
GCATCACGGG 
CAGGCTGGTT 
TTGGCCACGC 
TCGTGACCGA 
TCTTAGAGGG 
ATGCCATCTA 
ACCCACACGA 
GTGGCCTGGA 
ATGGGGACGG 
ATGCTCCCAT 
ATGAGGTGCA 
CCACCTACCT 
AGAGCAACCA 
ACACCCTGTA 
CAGCCACCAT 
CCAAAGTCGT 
CAGAAGACCC 
GGTGGCTAGC 
AGGATGAGCA 
GAAGCCCTCC 
ATGGCCCAGT 
TGCTGAACAT 
CAGATGACTC 
TGTCCCTGAA 
ATGGCAACAA 
TCGAAACCTG 
TGGCTCTGCT 
AGGAGCCCCT 
AGGGGGGTGG 
CCAGGCCGGA 
ACCGTCCTCG 
CGGCTAACAC 
GCAGCGGCTC 
AAGATTACGA 
GTGGCGGGGA 
AGAGCATCTC 
AGTGGCCGTA 
TTAGCCTTTC 
CTGGGCCAGG 
TCAACCCTGT 
GAATGGAACC 



31 
I 

CCGCCGTCGC 
TCTCGCGTCT 
CCGGGCGGTC 
CGGCCAGGCG 
CACTGATAAT 
GAAGGAAAGG 
AGATTGGGTG 
ACTGAATCAG 
GCCGGGGGCA 
GTTGTTGAAT 
TGTGTCAGAG 
CCAGAATGAC 
AGTCCTACCA 
CACCTACAAT 
CCTCATGTTC 
CCGGGAAAAA 
CTCCACCACC 
GTTTGACCCC 
GAGGCTGACG 
TATCATGGGC 
GGGCATCCTG 
CGTTGAAGTG 
AGTGGTCCAC 
TGAGGTCCAG 
TGACAAGGAG 
CATGGACCCA 
GTTTGTGAGG 
CACCACTGGC 
CCCTGAGCCC 
CACGGACAAG 
AGACAT CTAC 
GAAGTTCCTG 
AGAGCAGCTG 
CCCTGGACCC 
GTTCCTCCTG 
CCTACTCCCA 
CGAAGAGGAC 
GGTGGTTCTC 
GCCAGCCAAC 
AGACCCCACA 
CGACGCCGCG 
TTATCTGAAC 
GGACGACTAG 
CAAGGGGTCT 
GCAACTTGGC 
AGGATGGAGG 
GTTGCCTCAG 
GTCCTGGGCC 
TTCTTAGGCC 



41 



GGCAGCTGCT 
CTCCTCCTTC 
TTCAGGGAGG 
CTGGGGAAAG 
GATGACTTCA 
AATCCATTGA 
GTTGCTCCAA 
CTCAAGTCTA 
GACAGCCCCC 
AAGCCACTGG 
AATGGTGCCT 
CACAAGCCCA 
GGTACTTCTG 
GGGGTGGTTG 
ACCATTCACC 
GTCCCTGAGT 
ACGGCAGTGG 
CAGAAGTACG 
GTCACTGATC 
GGTGACGACG 
ACAACCAGGA 
ACCAACGAGG 
GTGGAGGATG 
GAGGGCATCC 
AATCAAAAGA 
GACAGTGGGC 
AACAACATCT 
ACGGGAACCC 
CGTCAGATCA 
GACCTGTCTC 
TGGACGGCAG 
AAGCAGGATA 
ACGGTGATCA 
TGGAAGGGAG 
CTGGTGCTGC 
GAAGATGACA 
CAGGACTATG 
CGCAATGACG 
CCAGATGAAA 
GCCCCGCCCT 
TCCCTGAGCT 
GAGTGGGGCA 
GCGGCCTGCC 
CAGTTCCCCC 
GGAGACAGGC 
AATGTGGGCA 
AGGCCAAGTT 
TGGGCCTGCT 
TCCTGGTGCA 



51 
I 

TCACCCCTCT 6 0 

TCCAGGTTTG 12 0 

CTGAAGTGAC 180 

TATTCATGGG 240 

CTGTGCGGAA 3 00 

AGATCTTCCC 3 60 

TATCTGTCCC 42 0 

ATAAAGATAG 480 

CTGAGGGTGT 540 

ACCGGGAGGA 600 

CAGTGGAGGA 660 

AGTTTACCCA 72 0 

TGATGCAGGT 7 8 0 

CTTACTCCAT 840 

GGAGCACAGG 900 

ACACACTGAC 960 

CAGTAGTGGA 102 0 

AGGCCCATGT 1080 

TGGACGCCCC 1140 

GGGACCATTT 12 0 0 

AGGGTTTGG A 12 60 

CCCCTTTTGT 132 0 

TGAATGAGGC 13 80 

CCACTGGGGA 144 0 

TCAGCTACCG 15 0 0 

AGGT C ACAGC 1560 

ATGAAGTCAT 162 0 

TTCTGCTAAC 1680 

CCATCTGCAA 1740 

CCCACACCTC 18 0 0 

AGGT CAACG A 18 60 

CAT ATGACGT 192 0 

GGGCCACTGT 1980 

GTTTCATCCT 2 040 

TTTTGTTGGT 210 0 

CCCGTGACAA 2160 

ACATCACCCA 2220 

TGGCACCAAC 22 80 

TCGGCAACTT 2340 

ACGACACCCT 2400 

CCCTCACCTC 2460 

GCCGCTTCAA 2 520 

TGCAGGGCTG 2580 

TTCAGCTG AG 2 640 

TATGAGTCTG 2 700 

GTTTGACTTC 2760 

TCCAGAAGCC 2 82 0 

GTGACTGACC 2 8 80 

ACTTAATTTT 2 940 



391 



WO 02/086443 

TTTTTTTAAT GCTATCTTCA AAACGTTAGA GAAAGTT CTT CAAAAGTGCA GCCCAGAGCT 3 000 

GCTGGGCCCA CTGGCCGTCC TGCATTTCTG GTTT CCAGAC CCCAATGCCT CCCATTCGGA 3060 

TGGATCTCTG CGTTTTTATA CTGAGTGTGC CTAGGTTGCC CCTTATTTTT TATTTTCCCT 3120 

GTTGCGTTGC TATAGATGAA GGGTGAGGAC AATCGTGTAT ATGTACTAGA ACTTTTTTAT 3180 
TAAAGAAACT TTTCCCAGAA AAAAA 



PCT/US02/12476 



Seq ID NO: 539 Protein sequence 
Protein Accession #: NP_001784.2 



10 



15 



20 



25 



30 



35 



40 



45 



MGLPRGPLAS 
QEPALFSTDN 
KGPFPQRLNQ 
YELFGHAVSE 
DEDDAIYTYN 
TDMDGDGSTT 
AWRATYLIMG 
PTSTATIWH 
DPAGWLAMDP 
VNDHGPVPEP 
TWLSLKKFL 
GAVLALIiFLL 
GLEARPEWL 
DYEGSGSDAA 



11 

1 

LLLLQVCWLQ 
DDFTVRNGET 
LKSUKDRDTK 
NGASVEDPMN 
GWAYSIHSQ 
TAVAWEILD 
GDDGDHFTIT 
VEDVNEAPVF 
DSGQVTAVGT 
RQITICNQSP 
KQDTYDVHLS 
LVLLLLVRKK 
RNDVAPTIIP 
SLSSLTSSAS 



21 
I 

CAASEPCRAV 
VQERRSLKER 
IFYSITGPGA 
ISIIVTDQND 
EPKDPHDLMF 
ANDNAPMFDP 
THPESNQGIL 
VPPSKWEVQ 
LDREDEQFVR 
VRQVLNITDK 
LSDHGNKEQL 
RKIKEPLLLP 
TPMYRPRPAN 
DQDQDYDYLN 



31 



41 



FREAEVTLEA 
NPLKIFPSKR 
DSPPEGVFAV 
HKPKFTQDTF 
TIHRSTGTIS 
QKYEAHVPEN 
TTRKGLDFEA 
EGIPTGEPVC 
NNIYEVMVLA 
DLSPHTSPFQ 
TVIRATVCDC 
EDDTRDNVFY 
PDEIGNFIIE 
EWGSRFKKLA 



GGAEQEPGQA 
ILRRHKRDWV 
EKETGWLLLN 
RGSVLEGVLP 
VISSGLDREK 
AVGHEVQRLT 
KNQHTLYVEV 
VYTAEDPDKE 
MDNGSPPTTG 
AQLTDDSDIY 
HGHVETCPGP 
YGEEGGGEED 
NLKAANTDPT 
DMYGGGEDD 



51 

I 

LGKVFMGCPG 
VAPISVPENG 
KPLDREE I AK 
GTSVMQVTAT 
VPEYTLTIQA 
VTDLDAPNSP 
TNEAPFVLKL 
NQKISYRILR 
TGTLLLTLID 
WTAEYNEEGD 
WKGGF I LPVL 
QDYDITQLHR 
APPYDTLLVF 



Seq ID NO: 540 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..672 



I 

ATGAGGCTCC 
CGGGGCTCCC 
AAGGGCGGGG 
CTGCTCGCCT 
GCGAGACAAC 
TGTCATGTTT 
ACAGAGCCAT 
AAGCAGTGCT 
CTCCTGGAAG 
TTAGAGGGGC 
AG C TGTGGTG 
AGCCTGTCTT 



11 
I 

AAAGACCCCG 
CCTACCGGCC 
AGGGGGCGCC 
TGCTGCTGGT 
GAGATCCAGA 
GTGAGAGAGA 
ACTGCGTTAT 
CCGCTGGTTG 
AGCCCATGCC 
CACCTATCAA 
GGCTGTGGCT 
GA 



21 



31 



I 



I 



ACAGGCCCCG 
AGACCCGGGG 
GCGCGCTGAC 
CGTGGCCCTA 
GGACTCCCAG 
AAACACTTTC 
AGCGGCCGTG 
TGCAGCGATG 
CTTCTTTTAC 
CTCATCAGTG 
GGCCATCCTC 



GCGGGTGGGA 
AGAGGCGCGC 
CCTCCCTGGG 
CCGCGGGTGT 
CGAACGGACG 
GAGTGCCAGA 
AAAATATTTC 
GAGAGACCCA 
CTCAAGTGTT 
TTCAAAGAAT 
CTGCTGCTGG 



41 
I 

GGCGCGCGCC 
GGAGGCTGCG 
CACCGCTGGG 
GGACAGACGC 
AGGGTGACAA 
ACCCAAGGAG 
CACGTTTTTT 
AGCCAGAGGA 
GTAAAATTCG 
ATGCTGGGAG 
CCTCCATTGC 



51 
I 

CCGGGGCGGG 
AAGGTTCCAG 
GACGATGGCG 
CAACCTGACT 
TAGAGTGTGG 
GTGCAAATGG 
CATGGTTGCG 
GAAGCGGTTT 
CTACTGCAAT 
CATGGGTGAG 
AGCCGGCCTC 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 



Seq ID NO: 541 Protein sequence 
Protein Accession #: Eos sequence 



50 



55 



60 



65 



70 



75 



80 



1 11 21 31 41 51 

I I I I I I 

MRLQRPRQAP AGGRRAPRGG RGSPYRPDPG RGARRLRRFQ KGGEGAPRAD PPWAPLGTMA 

LLALLLWAL PRVWTDANLT ARQRDPEDSQ RTDEGDNRVW CHVCERENTF ECQNPRRCKW 

TEPYCVIAAV KIFPRFFMVA KQCSAGCAAM ERPKPEEKRF LLEEPMPFFY LKCCKIRYCN 

LEGPPINSSV FKEYAGSMGE SCGGLWIiAIL LLLASIAAGL SLS 

Seq ID NO: 542 DNA sequence 

Nucleic Acid Accession #: XM_035292.2 

Coding sequence: 53..1576 



85 



GCTCGCTGGG 
TGCGGGCCCG 
GGAGAAGATG 
CGTGACCCTG 
TATCGGCTCG 
GCTGGCGCTG 
CGCGGAGCTC 
CTACGGCTCG 
AT CGCAGTAC 
CTGCCCGGTG 
GGCCGTGAAC 
CAAGCTCCTG 
TGTGTCCAAT 
TGTGCTGGCA 
CACAGAGGAA 
CATCGTGACG 
GCAGATGCTG 
GTCCTGGATC 
GTTCACATCC 
CTCCATGATC 
GACGCTGCTC 
CAACTGGCTC 
TGAGCTTGAG 
CCTCTTCCTG 
CATCATCCTC 
GTGGCTCCTC 



11 

I 

CCGCGGCTCC 
AAGCGGCGCG 
CTGGCCGCCA 
CAGCGGAACA 
GGCATCTTCG 
GTGGTGTGGG 
GGCACCACCA 
CTGCCCGCCT 
ATCGTGGCCC 
CCCGAGGAGG 
TGCTACAGCG 
GCCCTGGCCC 
CTAGATCCCA 
TTATACAGCG 
ATGATCAACC 
CTGGTGTACG 
TCGTCCGAGG 
ATCCCCGTCT 
TCCAGGCTCT 
CACCCACAGC 
TACGCCTTCT 
TGCGTGGCCC 
CGGCCCATCA 
ATCGCCGTCT 
AGCGGGCTGC 
CAGGGCAT CT 



21 

I 

CGGGTGTCCC 
CGCTAGCGGC 
AGAGCGCGGA 
TCACGCTGCT 
TGACGCCCAC 
CCGCGTGCGG 
TCTCCAAATC 
TCCTCAAGCT 
TGGTCTTCGC 
CAGCCAAGCT 
TGAAGGCCGC 
TGATCATCCT 
ACTTCTCATT 
GCCTCTTTGC 
CCTACAGAAA 
TGCTGACCAA 
CCGTGGCCGT 
TCGTGGGCCT 
TCTTCGTGGG 
TCCTCACCCC 
CCAAGGACAT 
TGGCCATCAT 
AGGTGAACCT 
CCTTCTGGAA 
CCGTCTACTT 
TCTCCACGAC 



31 
i 

AGGCCCGGCC 
GCCGGCGGCC 
CGGCTCGGCG 
CAACGGCGTG 
GGGCGTGCTC 
CGTCTTCTCC 
GGGCGGCGAC 
CTGGATCGAG 
CACCTACCTG 
CGTGGCCTGC 
CACCCGGGTC 
GCTGGGCTTC 
TGAAGGCACC 
CTATGGAGGA 
CCTGCCCCTG 
CCTGGCCTAC 
GGACTT CGGG 
GTCCTGCTTC 
GTCCCGGGAA 
CGTGCCGTCC 
CTTCTCCGTC 
CGGCATGATC 
GGCCCTGCCT 
GACACCCGTG 
CTTCGGGGTC 
CGTCCTGTGT 



41 

i 

GGTGCGCAGA 
GAGGAGAAGG 
CCGGCAGGCG 
GCCATCATCG 
AAGGAGGCAG 
ATCGTGGGCG 
TACGCCTACA 
CTGCTCATCA 
CTCAAGCCGC 
CTCTGCGTGC 
CAGGATGCCT 
GTCCAGATCG 
AAACTGGATG 
TGGAATTACT 
GCCATCATCA 
TTCACCACCC 
AACTATCACC 
GGCTCCGTCA 
GGCCACCTGC 
CTCGTGTTCA 
ATCAACTTCT 
TGGCTGCGCC 
GTGTTCTTCA 
GAGTGTGGCA 
TGGTGGAAAA 
CAGAAGCTCA 



51 

I 

GCATGGCGGG 
AAGAGGCGCG 
AGGGCGAGGG 
TGGGGACCAT 
GCTCGCCGGG 
CGCTCTGCTA 
TGCTGGAGGT 
TCCGGCCTTC 
TCTTCCCCAC 
TGCTGCTCAC 
TTGCCGCCGC 
GAAAGGGTGA 
TGGGGAACAT 
TGAATTTCGT 
TCTCCCTGCC 
TGTCCACCGA 
TGGGCGTCAT 
ATGGGTCCCT 
CCTCCATCCT 
CGTGTGTGAT 
TCAGCTTCTT 
ACAGAAAG CC 
TCCTGGCCTG 
TCGGCTTCAC 
ACAAGCCCAA 
TGCAGGTGGT 



60 
120 
180 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 



392 



WO 02/086443 

CCCCCAGGAG ACATAGCCAG GAGGCCGAGT GGCTGCCGGA GGAGCATGC 



Seq ID NO: 543 Protein sequence 
Protein Accession #: XP_035292.2 



1 11 21 31 41 51 

l l l I I l 

MAGAGPKRRA LAAPAAEEKE EAREKMLAAK SADGSAPAGE GEGVTLQRNI TLLNGVAIIV 
GTIIGSGIFV T PTGVLKE AG S PGLALWWA ACGVFSIVGA LCYAELGTTI SKSGGDYAYM 
LEVYGSLPAF LKLWIELLII RPSSQYIVAL VFATYLLKPL FPTCPVPEEA AKLVACLCVL 
LLTAVNCYSV KAATRVQDAF AAAKLLALAL IILLGFVQIG KGDVSNLDPN FSFEGTKLDV 
GNIVLALYSG LFAYGGWNYL NFVTEEMINP YRNLPLAI I I SLPIVTLVYV LTNLAYFTTL 
STEQMLSSEA VAVDFGNYHL GVMSWIIPVF VGLSCFGSVN GSLFTSSRLF FVGSREGHLP 
SILSMIHPQL LTPVPSLVFT CVMTLLYAFS KDIFSVINFF SFFNWLCVAL AIIGMIWLRH 
RKPELERPIK VNLALPVFFI LACLFLIAVS FWKTPVECGI GFTIILSGLP VYFFGWWKN 
KPKWLLQGIF STTVLCQKLM QWPQET 

Seq ID NO: 544 DNA sequence 

Nucleic Acid Accession #: NM_005268.1 

Coding sequence: 168..989 

1 11 21 31 41 51 

i I I 1 I I 

TAAAAAGCAA AAGAATTCGC GGCCGCGTCG ACACGGGCTT CCCCGAAAAC CTTCCCCGCT 

TCTGGATATG AAATT CAAGC TGCTTGCTGA GTCCTATTGC CGGCTGCTGG GAGCCAGGAG 

AGCCCTGAGG AGTAGTCACT CAGTAGCAGC TGACGCGTGG GTCCACCATG AACTGGAGTA 

TCTTTGAGGG ACTCCTGAGT GGGGTCAACA AGTACTCCAC AGCCTTTGGG CGCATCTGGC 

TGTCTCTGGT CTTCATCTTC CGCGTGCTGG TGTACCTGGT GACGGCCGAG CGTGTGTGGA 

GTGATGACCA CAAGGACTTC GACTGCAATA CTCGCCAGCC CGGCTGCTCC AACGTCTGCT 

TTGATGAGTT CTTCCCTGTG TCCCATGTGC GCCTCTGGGC CCTGCAGCTT ATCCTGGTGA 

CATGCCCCTC ACTGCTCGTG GTCATGCACG TGGCCTACCG GGAGGTTCAG GAGAAGAGGC 

ACCGAGAAGC CCATGGGGAG AACAGTGGGC GCCTCTACCT GAACCCCGGC AAGAAGCGGG 

GTGGGCTCTG GTGGACATAT GTCTGCAGCC TAGTGTTCAA GGCGAGCGTG G AC AT CG C CT 

TTCTCTATGT GTTCCACTCA TTCTACCCCA AATATATCCT CCCTCCTGTG GTCAAGTGCC 

ACGCAGATCC ATGTCCCAAT ATAGTGGACT GCTTCATCTC CAAGCCCTCA GAGAAGAACA 

TTTTCACCCT CTTCATGGTG GCCACAGCTG CCATCTGCAT CCTGCTCAAC CTCGTGGAGC 

TCATCTACCT GGTGAGCAAG AGATGCCACG AGTGCCTGGC AGCAAGGAAA GCTCAAGCCA 

TGTGCACAGG TCATCACCCC CACGGTACCA CCTCTTCCTG CAAACAAGAC GACCTCCTTT 

CGGGTGACCT CATCTTTCTG GGCT CAGACA GTCATCCTCC T CT CT T AC CA GACCGCCCCC 

GAGACCATGT GAAGAAAACC ATCTTGTGAG GGGCTGCCTG GACTGGTCTG GCAGGTTGGG 

CCTGGATGGG GAGGCTCTAG CATCTCTCAT AGGTGCAACC TGAGAGTGGG GGAGCTAAGC 

CATGAGGTAG GGGCAGGCAA GAGAGAGGAT TCAGACGCTC TGGGAGCCAG TTCCTAGTCC 

T CAACTCC AG CCACCTGCCC CAGCTCGACG GCACTGGGCC AGTTCCCCCT CTGCTCTGCA 

GCTCGGTTTC CTTTTCTAGA ATGGAAATAG TGAGGGCCAA TGC 



Seq ID NO: 545 Protein sequence 
Protein Accession #: NP_005259.1 

1 11 21 31 41 51 

I I I I I I 

MNWSIFEGLL SGVNKYSTAF GRIWLSLVFI FRVLVYLVTA ERVWSDDHKD FDCNTRQPGC 

SNVCFDEFFP VSHVRLWALQ LILVTCPSLL WMHVAYREV QEKRHREAHG ENSGRLYLNP 

GKKRGGLWWT YVCSLVFKAS VDIAFLYVFH SFYPKYILPP WKCHADPCP NIVDCFISKP 

SEKNIFTLFM VATAAICILL NLVELIYLVS KRCHECLAAR KAQAMCTGHH PHGTTSSCKQ 

DDLLSGDLIF LGSDSHPPLL PDRPRDHVKK TIL 



Seq ID NO: 546 DNA sequence 

Nucleic Acid Accession #: NM_002391.1 

Coding sequence: 26..457 



1 11 21 31 41 51 

I I l I I I 

CGGGCGAAGC AGCGCGGGCA GCGAGATGCA GCACCGAGGC TTCCTCCTCC TCACCCTCCT 
CGCCCTGCTG GCGCTCACCT CCGCGGTCGC CAAAAAGAAA GATAAGGTGA AGAAGGGCGG 
CCCGGGGAGC GAGTGCGCTG AGTGGGCCTG GGGGCCCTGC ACCCCCAGCA GCAAGGATTG 
CGGCGTGGGT TTCCGCGAGG GCACCTGCGG GGCCCAGACC CAGCGCATCC GGTGCAGGGT 
GCCCTGCAAC TGGAAGAAGG AGTTTGGAGC CGACTGCAAG TACAAGTTTG AGAACTGGGG 
TGCGTGTGAT GGGGGCACAG GCACCAAAGT CCGCCAAGGC ACCCTGAAGA AGGCGCGCTA 
CAATGCTCAG TGCCAGGAGA CCATCCGCGT CACCAAGCCC TGCACCCCCA AG AC CAAAG C 
AAAGGCCAAA GCCAAGAAAG GGAAGGGAAA GGACTAGACG CCAAGCCTGG ATGCCAAGGA 
GCCCCTGGTG TCACATGGGG CCTGGCCACG CCCTCCCTCT CCCAGGCCCG AGATGTGACC 
CACCAGTGCC TTCTGTCTGC TCGTTAGCTT TAAT CAATCA TGCCCTGCCT TGTCCCTCTC 
ACTCCCCAGC CCCACCCCTA AGTGCCCAAA GTGGGGAGGG ACAAGGGATT CTGGGAAGCT 
TGAGCCTCCC CCAAAGCAAT GTGAGTCCCA GAGCCCGCTT TTGTTCTTCC CCACAATTCC 
ATTACTAAGA AACACAT CAA ATAAACTGAC TTTTTCCCCC CAATAAAAGC TCTTCTTTTT 
TAATAT 



Seq ID NO: 547 Protein sequence 
Protein Accession #: NP_002382.1

1 11 21 31 41 51

l l I l l I 

MQHRGFLLLT LL ALL ALT S A VAKKKDKVKK GGPGSECAEW AWGPCTPSSK DCGVGFREGT 
CGAQTQRIRC RVPCNWKKEF GADCKYKFEN WGACDGGTGT KVRQGTLKKA RYNAQCQETI 
RVTKPCTPKT KAKAKAKKGK GKD 



Seq ID NO: 548 DNA sequence
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Nucleic Acid Accession #: NM_00€ 
Coding sequence: 1..786 

1 11 21 

I i \ 

ATGGATTGGG GGACGCTGCA CACTTTCATC 

GGGAAGGTGT GGATCACAGT CATCTTTATT 

CAGGAAGTGT GGGGTGACGA GCAAGAGGAC 

AAAAATGTGT GCTATGACCA CTTTTTCCCG 

CTGATCTTCG TCTCCACCCC AGCGCTGCTG 

GAAACCACTC GCAAGTTCAG GCGAGGAGAG 

ATTAAAAAGC ACAAGGTTCG GATAGAGGGG 

TTTTTCCGAA TCATCTTTGA AGCAGCCTTT 

TACCACCTGC CCTGGGTGTT GAAATGTGGG 

TTTATTTCTA GGCCAACAGA GAAGACCGTG 

ATTTGCATGC TGCTTAACGT GGCAGAGTTG 

AGATCAAAGA GAGCACAGAC GCAAAAAAAT 

CAGAATGAAA TGAATGAGCT GATTTCAGAT 

AGCTAA 



83 .1 



31 41 51 

1 i I 

GGGGGTGTCA ACAAACACTC CACCAGCATC 

TTCCGAGTCA TGATCCTAGT GGTGGCTGCC 

TTCGTCTGCA ACACACTGCA ACCGGGATGC 

GTGT CCCACA TCCGGCTGTG GGCCCTCCAG 

GTGGCCATGC ATGTGGCCTA CTACAGGCAC 

AAGAGGAATG ATTTCAAAGA CATAGAGGAC 

TCGCTGTGGT GGACGTACAC CAGCAGCATC 

ATGTATGTGT TTTACTTCCT TTACAATGGG 

ATTGACCCCT GCCCCAACCT TGTTGACTGC 

TTTACCATTT TTATGATTTC TGCGTCTGTG 

TGCTACCTGC TGCTGAAAGT GTGTTTTAGG 

CACCCCAATC ATGCCCTAAA GGAGAGTAAG 

AGTGGTCAAA ATGCAAT CAC AGGTTTCCCA 



Seq ID NO: 549 Protein sequence
Protein Accession #: NP_006774.1



1 11 21 31 41 51 

I I I I I I 

MDWGTLHTFI GGVNKHSTSI GKVWITVIFI FRVMILWAA QEVWGDEQED FVCNTLQPGC 

KNVCYDHFFP VSHIRLWALQ. LIFVSTPALL VAMHVAYYRH ETTRKFRRGE KRNDFKD I ED 

IKKHKVRIEG SLWWTYTSSI FFRIIFEAAF MYVFYFLYNG YHLPWVLKCG IDPCPNLVDC 

FISRPTEKTV FTIFMISASV ICMLLNVAEL CYLIjLKVCFR RSKRAQTQKN HPNHALKESK 

QNEMNELISD SGQNAITGFP S 



Seq ID NO: 550 DNA sequence 

Nucleic Acid Accession #: NM_002571.1 

Coding sequence: 99.. 587 



1 11 21 31 41 51 

l I I l l I 

CATCCCTCTG GCTCCAGAGC TCAGAGCCAC CCACAGCCGC AGCCATGCTG TGCCTCCTGC 
TCACCCTGGG CGTGGCCCTG GTCTGTGGTG TCCCGGCCAT GGACATCCCC CAGACCAAGC 
AGGACCTGGA GCTCCCAAAG TTGGCAGGGA CCTGGCACTC CATGGCCATG GCGACCAACA 
ACATCTCCCT CATGGCGACA CTGAAGGCCC CTCTGAGGGT CCACATCACC TCACTGTTGC 
CCACCCCCGA GGACAACCTG GAGATCGTTC TGCACAGATG GGAGAACAAC AGCTGTGTTG 
AGAAGAAGGT CCTTGGAGAG AAGACTGGGA AT CC AAAGAA GTTCAAGATC AACTATACGG 
TGGCGAACGA GGCCACGCTG CTCGATACTG ACTACGACAA TTTCCTGTTT CTCTGCCTAC 
AGGACACCAC CACCCCCATC C AG AG CATGA TGTGCCAGTA CCTGGCCAGA GTCCTGGTGG 
AGGACGATGA GAT CATGCAG GGATT CAT CA GGGCTTTCAG GCCCCTGCCC AGGCACCTAT 
GGTACTTGCT GGACTTGAAA CAGATGGAAG AGCCGTGCCG TTTCTAGCTC ACCTCCGCCT 
CCAGGAAGAC CAGACTCCCA CCCTTCCACA CCTCCAGAGC AGTGGGACTT CCTCCTGCCC 
TTTCAAAGAA TAACCACAGC TCAGAAGACG ATGACGTGGT CATCTGTGTC GCCATCCCCT 
TCCTGCTGCA CACCTGCACC ATTGCCATGG GGAGGCTGCT CCCTGGGGGC AGAGTCTCTG 
G CAGAGGTTA TTAATAAACC CTTGGAGCAT G 



Seq ID NO: 551 Protein sequence 
Protein Accession #: NP_002562.1 

1 11 21 31 41 51 

I I I I I I 

MDIPQTKQDL ELPKLAGTWH SMAMATNNIS LMATLKAPLR VHITSLLPTP EDNLEIVLHR 

WENNSCVEKK VLGEKTGNPK KFKINYTVAN EATLLDTDYD NFLFLCLQDT TTPIQSMMCQ 

YLARVLVEDD EIMQGFIRAF RPLPRHLWYL LDLKQMEEPC RF 



Seq ID NO: 552 DNA sequence 

Nucleic Acid Accession #: NM_006500.1

Coding sequence: 27.. 1967 



1 11 

i l 

ACTTGCGTCT CGCCCTCCGG 
TCGCCGCCTG CTGCTGCTGT 
CGCCTGAGCT GGTGGAGGTG 
AGTCCCAAGG CAACCTCAGC 
TCATCTTCCG TGTGCGCCAG 
TCAGCCTCCA GGACAGAGGG 
GCATCTTCTT GTGCCAGGGC 
TCTACAAAGC TCCGGAGGAG 
GTAAGGAGCC TGAGGAGGTC 
TCATCTGGTA CAAGAATGGC 
CGTCCCAGAC TGTGGAGTCG 
TGGTTAAAGA AGACAAAGAT 
GGAACCACAT GAAGGAGTCC 
TGTGGCTGGA AGTGGAGCCC 
GTTTGGCTGA TGGCAACCCT 
GGGAGGCAGA GGAAGAGACA 
AGGAACACAG TGGGCGCTAT 
TGAGTGAACC ACAGGAACTA 
CCCCTGAGAG ACAGGAAGGC 
ACCT CGAGTT CCAGTGGCTG 



21 31 

I I 
CCAAGCATGG GGCTTCCCAG 

CCTCGCGTCG CGGGTGTGCC 

GAAGTGGGCA GCACAGCCCT 

CATGTCGACT GGTTTTCTGT 

GGCCAGGGCC AGAGCGAACC 

GCTACTCTGG CCCTGACTCA 

AAGCGCCCTC GGT CCCAGGA 

CCAAACATCC AGGTCAACCC 

GCTACCTGTG TAGGGAGGAA 

CGGCCTCTGA AGGAGGAGAA 

AGTGGTTTGT ACACCTTGCA 

GCCCAGTTTT ACTGTGAGCT 

AGGGAAGTCA CCGTCCCTGT 

GTGGGAATGC TGAAGGAAGG 

CCACCACACT TCAGCATCAG 

ACCAACGACA ACGGGGTCCT 

GAATGTCAGG CCTGGAACTT 

CTGGTGAACT ATGTGTCTGA 

AGCAGCCTCA CCCTGACCTG 

AGAGAAGAGA CAGACCAGGT 



41 51 

I i 
GCTGGTCTGC GCCTTCTTGC 

CGGAGAGGCT GAGCAGCCTG 

TCTGAAGTGC GGCCTCTCCC 

CCACAAGGAG AAGCGGACGC 

TGGGGAGTAC GAGCAGCGGC 

AGTCACCCCC CAAGACGAGC 

GTACCGCATC CAGCTCCGCG 

CCTGGGCATC CCTGTGAACA 

CGGGTACCCC ATTCCTCAAG 

GAACCGGGTC CACATTCAGT 

GAGTATTCTG AAGGCACAGC 

CAACTACCGG CTGCCCAGTG 

TTTCTACCCG ACAGAAAAAG 

GGACCGCGTG GAAATCAGGT 

CAAGCAGAAC CCCAGCACCA 

GGTGCTGGAG CCTGCCCGGA 

GGACACCATG ATATCGCTGC 

CGTCCGAGTG AGTCCCGCAG 

TGAGGCAGAG AGTAGCCAGG 

GCTGGAAAGG GGGCCTGTGC 
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TTCAGTTGCA TGACCTGAAA CGGGAGGCAG GAGGCGGCTA TCGCTGCGTG GCGTCTGTGC 1260 

CCAGCATACC CGGCCTGAAC CGCACACAGC TGGTCAAGCT GGCCATTTTT GGCCCCCCTT 1320 

GGATGGCATT CAAGGAGAGG AAGGTGTGGG TGAAAGAGAA TATGGTGTTG AATCTGTCTT 1380 

GTGAAGCGTC AGGGCACCCC CGGCCCACCA TCTCCTGGAA CGTCAACGGC ACGGCAAGTG 1440 

AACAAGACCA AGATCCACAG CGAGTCCTGA GCACCCTGAA TGTCCTCGTG ACCCCGGAGC 150 0 

TGTTGGAGAC AGGTGTTGAA TGCACGGCCT CCAACGACCT GGGCAAAAAG ACCAGCATCC 1560 

TCTTCCTGGA GCTGGTCAAT TTAACCACCC TCACACCAGA CTCCAACACA ACCACTGGCC 162 0 

TCAGCACTTC CACTGCCAGT CCTCATACCA GAGCCAACAG CACCTCCACA GAGAGAAAGC 1680 

TGCCGGAGCC GGAGAGCCGG GGCGTGGTCA TCGTGGCTGT GATTGTGTGC ATCCTGGTCC 1740 

TGGCGGTGCT GGGCGCTGTC CTCTATTTCC TCTATAAGAA GGGCAAGCTG CCGTGCAGGC 1800 

GCTCAGGGAA GCAGGAGATC ACGCTGCCCC CGTCT CGTAA GACCGAACTT GTAGTTGAAG 1860 

TTAAGTCAGA TAAGCTCCCA GAAGAGATGG GCCTCCTGCA GGGCAGCAGC GGTGACAAGA 1920 

GGGCTCCGGG AGACCAGGGA GAGAAATACA TCGATCTGAG GCATTAGCCC CGAATCACTT 1980 

CAGCTCCCTT CCCTGCCTGG ACCATTCCCA GCTCCCTGCT CACTCTTCTC TCAGCCAAAG 2 040 

CCTCCAAAGG GACTAGAGAG AAGCCTCCTG CTCCCCTCAC CTGCACACCC CCTTT CAGAG 2100 

GGCCACTGGG TTAGGACCTG AGGACCTCAC TTGGCCCTGC AAGCCGCTTT TCAGGGACCA 2160 

GTCCACCACC ATCTCCTCCA CGTTGAGTGA AGCTCATCCC AAGCAAGGAG CCCCAGTCTC 222 0 

CCGAGCGGGT AGGAGAGTTT CTTGCAGAAC GTGTTTTTTC TTTACACACA TTATGGCTGT 22 8 0 

AAATACCTGG CTCCTGCCAG CAG CTGAGCT GGGTAGCCTC TCTGAGCTGG TTTCCTGCCC 2 34 0 

CAAAGGCTGG CTTCCACCAT CCAGGTGCAC CACTGAAGTG AGGACACACC GGAGCCAGGC 2400 

GCCTGCTCAT GTTGAAGTGC GCTGTTCACA CCCGCTCCGG AGAGCACCCC AGCGGCATCC 24 60 

AGAAGCAGCT GCAGTGTTGC TGCCACCACC CTCCTGCTCG CCTCTTCAAA GTCTCCTGTG 252 0 

ACATTTTTTC TTTGGTCAGA AGCCAGGAAC TGGTGT CATT CCTTAAAAGA TACGTGCCGG 2580 

GGCCAGGTGT GGTGGCTCAC GCCTGTAATC CCAGCACTTT GGGAGGCCGA GGCGGGCGGA 2640 

TCACAAAGTC AGGACGAGAC CAT CCTGGCT AACACGGTGA AACCCTGTCT CTACTAAAAA 2 70 0 

TACAAAAAAA AATTAG CTAG GCGTAGTGGT TGGCACCTAT AGTCCCAGCT ACT CGG AAGG 2 760 

CTGAAGCAGG AGAATGGTAT GAATCCAGGA GGTGGAGCTT GCAGTGAGCC GAGACCGTGC 2 820 

CACTGCACTC CAGCCTGGGC AACACAGCGA GACTCCGTCT CGAGGAAAAA AAAAGAAAAG 2 880 

ACGCGTACCT GCGGTGAGGA AGCTGGGCGC TGTTTTCGAG TTCAGGTGAA TTAGCCTCAA 2940 

TCCCCGTGTT CACTTGCTCC CATAGCCCTC TTGATGGATC ACGTAAAACT GAAAGGCAGC 3 00 0 

GGGGAGCAGA CAAAGATGAG GTCTACACTG TCCTTCATGG GGATTAAAGC TATGGTTATA 3 0 60 

TTAGCACCAA ACTTCTACAA ACCAAGCTCA GGGCCCCAAC CCTAGAAGGG CCCAAATGAG 312 0 

AGAATGGTAC TTAGGGATGG AAAACGGGGC CTGGCTAGAG CTTCGGGTGT GTGTGTCTGT 3180 

CTGTGTGTAT GCATACATAT GTGTGTATAT ATGGTTTTGT CAGGTGTGTA AATTTGCAAA 3240 

TTGTTTCCTT TATATATGTA TGTATATATA TATATGAAAA TATATATATA TATGAAAAAT 3300 

AAAGCTTAAT TGTCCCAGAA AATCATACAT TGCTTTTTTA TTCTACATGG GTACCACAGG 3 3 60 

AACCTGGGGG CCTGTGAAAC TACAACCAAA AGGCACACAA AACCGTTTCC AGTTGGCAGC 3420 

AGAGATCAGG GGTTACCTCT GCTTCTGAGC AAATGGCTCA AGCTCTACCA GAGCAGACAG 3 480 

CTACCCTACT TTTCAGCAGC AAAACGTCCC GTATGACGCA GCACGAAGGG CCTGGCAGGC 3 540 
TGTTAGCAGG AGCTATGTCC CTTCCTATCG TTTCCGTCCA CTT 

Seq ID NO: 553 Protein sequence 
Protein Accession #: NP_006491.1 

1 11 21 31 41 51 

l I l l I I 

GLPRLVCAFL LAACCCCPRV AGVPGEAEQP APBLVEVEVG STALLKCGLS QSQGNLSHVD 60 

WFSVHKEKRT LIFRVRQGQG QSEPGEYEQR LSLQDRGATL ALTQVTPQDE RIFLCQGKRP 120 

RSQEYRIQLR VYKAPEEPNI QVNPLGIPVN SKEPEEVATC VGRNGYPIPQ VIWYKNGRPL 180 

KEEKNRVHIQ SSQTVESSGL YTLQSILKAQ LVKEDKDAQF YCELNYRLPS GNHMKESREV 240 

TVPVFYPTEK VWLEVEPVGM LKEGDRVEIR CLADGNPPPH FSISKQNPST REAEEETTND 300 

NGVLVLE PAR KEHSGRYECQ AWNLDTMISL LSEPQEKLVN YVSDVRVSPA APERQEGSSL 360 

TLTCEAESSQ DLEFQWLREE TDQVLERGPV LQLHDLKREA GGGYRCVASV PSIPGLNRTQ 42 0 

LVKLAIFGPP WMAFKERKVW VKENMVLNLS CEASGHPRPT ISWNVNGTAS EQDQDPQRVL 48 0 

STLNVLVTPE LLETGVECTA SNDLGKNTSI LFLELVNLTT LTPDSNTTTG LSTSTASPHT 540 

RANSTSTERK LPEPESRGW IVAVIVCILV IiAVLGAVLYF LYKKGKLPCR RSGKQEITLP 600 
PSRKTELWE VKSDKLPEEM GLLQGSSGDK RAPGDQGEKY IDLRH 

Seq ID NO: 554 DNA sequence 

Nucleic Acid Accession #: NM_003183.3 

Coding sequence: 165.. 2639

1 11 21 31 41 51 

I I ! i I I 

TCGAGCCTGG CGGTAGAATC TTCCCAGTAG GCGGCGCGGG AGGGAAAAGA GGATTGAGGG 60 

GCTAGGCCGG GCGGATCCCG TCCTCCCCCG ATGTGAGCAG TTTTCCGAAA CCCCGTCAGG 12 0 

CGAAGGCTGC CCAGAGAGGT GGAGTCGGTA GCGGGGCCGG GAACATGAGG CAGTCTCTCC 180 

TATTCCTGAC CAGCGTGGTT CCTTTCGTGC TGGCGCCGCG ACCTCCGGAT GACCCGGGCT 240 

TCGGCCCCCA CCAGAGACTC GAGAAGCTTG ATTCTTTGCT CTCAGACTAC GATATTCTCT 3 00 

CTTTATCTAA TATCCAGCAG CATTCGGTAA GAAAAAGAGA TCTACAGACT TCAACACATG 3 60 

TAGAAACACT ACTAACTTTT TCAGCTTTGA AAAGGCATTT TAAATTATAC CTGACATCAA 420 

GTACTGAACG TTTTTCACAA AATTTCAAGG TCGTGGTGGT GGATGGTAAA AACGAAAGCG 480

AGTACACTGC AAAATGGCAG GACTTCTTCA CTGGACACGT GGTTGGTGAG CCTGACTCTA 540 

GGGTTCTAGC CCACATAAGA GATGATGATG TTATAATCAG AAT CAACACA GATGGGGCCG 600 

AATATAACAT AGAGCCACTT TGGAGATTTG TTAATGATAC CAAAGACAAA AGAATGTTAG 660 

TTTATAAATC TGAAGATATC AAGAATGTTT CACGTTTGCA GTCTCCAAAA GTGTGTGGTT 72 0 

ATTTAAAAGT GGATAATGAA GAGTTGCTCC CAAAAGGGTT AGTAGACAGA GAACCACCTG 780 

AAGAGCTTGT TCATCGAGTG AAAAGAAGAG CTGACCCAGA TCCCATGAAG AACACGTGTA 840 

AATTATTGGT GGTAGCAGAT CATCGCTTCT ACAGATACAT GGGCAGAGGG GAAGAGAGTA 900 

CAACTACAAA TTACTTAATA GAGCTAATTG ACAGAGTTGA TGACATCTAT CGGAACACTT 960 

CATGGGATAA TGCAGGTTTT AAAGGCTATG GAATACAGAT AGAGCAGATT CGCATTCTCA 1020 

AGTCTCCACA AGAGGTAAAA CCTGGTGAAA AG CACT ACAA CATGGCAAAA AGTTACCCAA 1080 

ATGAAGAAAA GGATGCTTGG GATGTGAAGA TGTTG CTAGA GCAATTTAGC TTTGATATAG 1140 

CTGAGGAAGC ATCTAAAGTT TGCTTGGCAC ACCTTTTCAC ATACCAAGAT TTTGATATGG 1200 

GAACTCTTGG ATTAGCTTAT GTTGGCTCTC CCAG AG CAAA CAGCCATGGA GGTGTTTGTC 1260 

CAAAGGCTTA TTATAGCCCA GTTGGGAAGA AAAATATCTA TTTGAATAGT GGTTTGACGA 132 0 

GCACAAAGAA TTATGGTAAA ACCATCCTTA CAAAGGAAGC TGACCTGGTT ACAACTCATG 1380 
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AATTGGGACA TAATTTTGGA 
ATGAGGACCA GGGAGGGAAA 
ACAATAAGAT GTTTTCAAAC 
CCCAGGAGTG TTTTCAAGAA 
GAGAAGAGTG TGATCCTGGC 
GCACGTTGAA GGAAGGTGTC 
AGTTTGAGAC TGCCCAGAAG 
CCTACTGCAC AGGTAATAGC 
TTTGCTTGGA TCTTGGCAAG 
AGCAG CTGGA GTCCTGTGCA 
ACCTTTCTGG CCGCTGTGTG 
AAGGAAAGCC CTGTACAGTA 
AGGATGTAAT TGAACGATTT 
AGTTTTTAGC AGACAACATC 
CTTTCAGCAT TCTTGTCCAT 
CTCTGTTTCA CCCCAGTAAC 
TTATCAAACC CTTTCCTGCG 
CTTCGGCGCC AGCAGCTCCA 
CCAGCACAGA CTCCCATATG 
GCACAGCTGC CAAGTCATTT 
CTGCCTCCTT TAAACTG CAG 
TTAGTTCTCA GCTCTTCTGA 
TCAATCACAG CTTGTATTTT 
TTTGAACTTC CTGCAGGTAA 
TAAGGTGAAA GTGAATCTAC 
TTGACCTGTG GTGCAAAAGC 
TGTAAATTAA TCTTTTATAT 
ATACACTGTA ATGAACCGCT 
ATAGTTTTTT tTTTTTTTTT 
GTATACATTG TATCTAAATT 
CAGGGAAAAT ATATATCTAA 
TAAGACTAAT GCTCAGAACC 
TTGAATTTAT GGAATCTACC 
TTTTATAAGT ATCTTCATGT 
CTATTGGCTG GGAGTGGTGG 
CGCCACTACA CTCCAGCCTG 



PCT/US02/12476 



GCAGAACATG 
TATGTCATGT 
TGCAGTAAAC 
CGCAGCAATA 
ATCATGTATC 
CAGTGCAGTG 
AAGTGCCAGG 
AGTGAGTGCC 
TGTAAGGATG 
TGTAATGAAA 
CCCTATGTCG 
GGATTTTGTG 
TGGGATTTCA 
GTTGGGTCTG 
TGTGTGGATA 
GTCGAAATGC 
CCCCAGACTC 
AAACTGGACC 
GACGAGGATG 
GAGGATCTCA 
CGT CAGAATC 
CTTAAGTGTG 
GTGAAGACTG 
ACAGTTCTTG 
TTATTTTGAG 
AGAAAATACA 
TGATAACAGC 
GAATATGAAG 
TTTTTTTTGC 
GTGGGTCTAT 
ATTTAGAAAT 
TAACCACTAC 
AACTGTTTAG 
ATCCCTGTTA 
CTCATGCCTG 
GGTGACAGAG 



ATCCGGATGG 
ATCCCATAGC 
AATCAAT CTA 
AAGTTTGTGG 
TGAACAACGA 
ACAGGAACAG 
AGGCGATTAA 
CGCCTCCAGG 
GGAAATGCAT 
CTGACAACTC 
ATGCTGAACA 
ACATGAATGG 
TTGACCAGCT 
TCCTGGTTTT 
AGAAATTGGA 
TGAGCAGCAT 
CAGGCCGCCT 
ACCAGAGAAT 
GGTTTGAGAA 
CGGACCATCC 
GTGTTAACAG 
CAAAATATTT 
GGAAGTGACT 
TGTGGTTTGG 
GCTTTCAGGT 
GCTGGATTGG 
ACTGACTAGG 
CATTTGGCAT 
CTTCAACTAA 
TTCTAGTTAT 
CATTTGGGTT 
CTTACAGTGA 
GGCCCTGATT 
CTGATAGGGA 
TAATCCCAGC 
TGAGATCTGC 



TCTAGCAGAA 
TGTGAGTGGC 
TAAGACCATT 
GAACT CGAGG 
CACCTGCTGC 
TCCTTGCTGT 
TGCTACTTGC 
AAATGCTGAA 
CCCTTTCTGC 
CTGCAAGGTG 
AAAGAACTTA 
CAAATGTGAG 
GAGCATCAAT 
CTCCTTGATA 
TAAACAGTAT 
GGATTCTGCA 
GCAGCCTGCC 
GGACACCATC 
GGACCCCTTC 
GGTCGCCAGA 
CAAAGAAACA 
TTATAGATTT 
TAGCAGATGC 
CCCTTCTCCT 
TTTAGTTTTT 
GTTATGAATA 
GAAATGATCA 
TTATTTGTGA 
AAACAAAGGA 
TACCCAGAGT 
AATATGGCTC 
GGGCTATACA 
TGCTGGGCAG 
TACATGTCTT 
ACTTGGAGAG 
CTC 



TGTGCCCCGA 1440 

GATCACGAGA 1500 

GAAAGTAAGG 1560 

GTGGATGAAG 162 0 

AACAGCGACT 1680 

AAAAACTGTC 1740 

AAAGGCGTGT 1800 

AATGACACTG 1860 

GAGAGGGAAC 192 0 

TGCTGCAGGG 1980 

TTTTTGAGGA 2 040 

AAACGAGT AC 2100 

ACTTTTGGAA 2160 

TTTTGGATTC 2220 

GAATCTCTGT 22 80 

TCGGTTCGCA 2 340 

CCTGTGATCC 240 0 

CAGGAAGACC 2 460 

CCAAATAGCA 252 0 

AGTGAAAAGG 2580 

GAGTGCTAAT 2 640 

GACCTACAAA 2700 

TGGT CATGTG 2 760 

TTTGAAAAGG 2 820 

AAAATATCTT 2 8 80 

TTTACGTTTT 2 94 0 

GTTTTTTTTT 3 0 0 0 

GAAAAGTGGA 3 060 

GATAAATTTA 312 0 

TTTTATGTAG 3180 

TTCATAATTC 3240 

TGGTAGCCAG 3 3 00 

TTTTTCTGTA 3 3 60 

AGAAAATTCA 3 42 0 

GCTGAGGTTG 3 480 



40 



Seq ID NO: 555 Protein sequence 
Protein Accession #: NP_003174.2



45 



50 



55 



1 

I 

MRQSLLFLTS 
QTSTHVETLL 
GEPDSRVLAH 
PKVCGYLKVD 
RGEESTTTNY 
AKSYPNEEKD 
HGGVCPKAYY 
AECAPNEDQG 
SRVDEGEECD 
TCKGVSYCTG 
KVCCRDhSGR 
INTFGKFLAD 
SASVRIIKPF 
PFPNSSTAAK 



11 



21 



31 



WPFVLAPRP 
TFSALKRHFK 
IRDDDVIIRI 
NEELLPKGLV 
LIELIDRVDD 
AWDVKMLLEQ 
SPVGKKNIYL 
GKYVMYP I AV 
PGIMYLNNDT 
NSSECPPPGN 
CVPYVDAEQK 
NIVGSVLVFS 
PAPQTPGRLQ 
SFEDLTDHPV 



PDDPGFGPHQ 
LYLTSSTERF 
NTDGAEYNIE 
DREPPEELVH 
IYRNTSWDNA 
FSFDIAEEAS 
NSGLTSTKNY 
SGDHENNKMF 
CCNSDCTLKE 
AENDTVCLDL 
NLFLRKGKPC 
LIFWIPFSIL 
PAPVIPSAPA 
ARSEKAASFK 



RLEKLDSLLS 
SQNFKWWD 
PLWRFVNDTK 
RVKRRADPDP 
GFKGYGIQIE 
KVCLAHLFTY 
GKTILTKEAD 
SNCSKQSIYK 
GVQCSDRNSP 
GKCKDGKCIP 
TVGFCDMNGK 
VHCVDKKLDK 
APKLDHQRMD 
LQRQNRVNSK 



41 

I 

DYDILSLSNI 
GKNESEYTAK 
DKRMLVYKSE 
MKNTCKLLW 
QIRILKSPQE 
QDFDMGTLGL 
LVTTHELGHN 
TIESKAQECF 
CCKNCQFETA 
FCEREQQLES 
CEKRVQDVIE 
QYESLSLFHP 
TIQEDPSTDS 
ETEC 



51 



QQHSVRKRDL 60 

WQDFFTGHW 120 

DIKNVSRLQS 180 

ADHRFYRYMG 240 

VKPGEKHYNM 3 0 0 

AYVGS PRAMS 3 60 

FGAEHDPDGL 42 0 

QERSNKVCGN 480 

QKKCQEAINA 540 

CACNETDNSG 60 0 

RFWDFIDQLS 660 

SNVEMLSSMD 72 0 

HMDEDGFEKD 780 



60 



Seq ID NO: 556 DNA sequence 

Nucleic Acid Accession #: NM_021832.1 

Coding sequence: 164.. 2248 



65 



70 



75 



80 



85 



TCGAGCCTGG 
CTAGGCCGGG 
GAAGGCTGCC 
ATTCCTGACC 
CGGCCCCCAC 
TTTATCTAAT 
AGAAACACTA 
TACTGAACGT 
GTACACTGTA 
GGTTCTAGCC 
ATATAACATA 
TTATAAATCT 
TTTAAAAGTG 
AGAGCTTGTT 
ATTATTGGTG 
AACTACAAAT 
ATGGGATAAT 
GTCTCCACAA 
TGAAGAAAAG 
TGAGGAAGCA 
AACTCTTGGA 
AAAGGCTTAT 
CACAAAGAAT 
ATTGGGACAT 



11 
I 

CGGTAGAATC 
CGGATCCCGT 
CAGAGAGGTG 
AGCGTGGTTC 
CAGAGACTCG 
ATCCAGCAGC 
CTAACTTTTT 
TTTTCACAAA 
AAATGGCAGG 
CACATAAGAG 
GAGCCACTTT 
GAAGATATCA 
GATAATGAAG 
CAT CGAGTGA 
GTAGCAGATC 
TACTTAATAG 
GCAGGTTTTA 
GAGGTAAAAC 
GATGCTTGGG 
TCTAAAGTTT 
TTAGCTTATG 
TATAGCCCAG 
TATGGTAAAA 
AATTTTGGAG 



21 



TTCCCAGTAG 
CCTCCCCCGA 
GAGTCGGTAG 
CTTTCGTGCT 
AGAAGCTTGA 
ATTCGGTAAG 
CAGCTTTGAA 
ATTTCAAGGT 
ACTTCTTCAC 
ATGATGATGT 
GGAGATTTGT 
AG AATGTTT C 
AGTTGCTCCC 
AAAGAAGAGC 
ATCGCTTCTA 
AG CTAATTG A 
AAGGCTATGG 
CTGGTGAAAA 
ATGTGAAGAT 
GCTTGGCACA 
TTGGCTCTCC 
TTGGGAAGAA 
CCATCCTTAC 
CAGAACATGA 



31 
I 

GCGGCGCGGG 
TGTGAGCAGT 
CGGGGCCGGG 
GGCGCCGCGA 
TTCTTTGCTC 
AAAAAGAGAT 
AAGGCATTTT 
CGTGGTGGTG 
TGGACACGTG 
TATAATCAGA 
TAATGATACC 
ACGTTTGCAG 
AAAAGGGTTA 
TGACCCAGAT 
CAGATACATG 
CAGAGTTGAT 
AATACAGATA 
GCACTACAAC 
GTTGCTAGAG 
CCTTTTCACA 
CAG AG CAAAC 
AAATATCTAT 
AAAGGAAGCT 
TCCGGATGGT 



41 

1 

AGGAAAAGAG 
TTTCCGAAAC 
AACATGAGGC 
CCTCCGGATG 
TCAGACTACG 
CTACAGACTT 
AAATTATACC 
GATGGTAAAA 
GTTGGTGAGC 
ATCAACACAG 
AAAGACAAAA 
TCTCCAAAAG 
GTAGACAGAG 
CCCATGAAGA 
GGCAGAGGGG 
GACATCTATC 
GAGCAGATTC 
ATGGCAAAAA 
CAATTTAGCT 
TACCAAGATT 
AGCCATGGAG 
TTGAATAGTG 
GACCTGGTTA 
CTAGCAGAAT 



51 
I 

GATTGAGGGG 60 

CCCGTCAGGC 12 0 

AGTCTCTCCT 180 

ACCCGGGCTT 240 

ATATTCTCTC 3 00 

CAACACATGT 360 

TGACATCAAG 42 0 

ACGAAAGCGA 480 

CTGACTCTAG 540 

ATGGGGCCGA 600 

GAATGTTAGT 660 

TGTGTGGTTA 720 

AACCACCTGA 780 

ACACGTGTAA 840 

AAGAGAGTAC 900 

GGAACACTTC 960 

GCATTCTCAA 1020 

GTTACCCAAA 1080 

TTGATATAGC 1140 

T TGATATGGG 1200 

GTGTTTGTCC 1260 

GTTTGACGAG 132 0 

CAACTCATGA 13 80 

GTGCCCCGAA 1440 
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TGAGGACCAG GGAGGGAAAT ATGTCATGTA TCCCATAGCT GTGAGTGGCG ATCACGAGAA 1500 

CAATAAGATG TTTTCAAACT GCAGTAAACA ATCAATCTAT AAGACCATTG AAAGTAAGGC 1560 

CCAGGAGTGT TTTCAAGAAC GCAG CAATAA AGTTTGTGGG AACTCGAGGG TGGATGAAGG 1620 

AGAAGAGTGT GATCCTGGCA TCATGTATCT GAACAACGAC ACCTGCTGCA ACAGCGACTG 1680 

CACGTTGAAG GAAGGTGTCC AGTGCAGTGA CAGGAACAGT CCTTGCTGTA AAAACTGTCA 1740 

GTTTGAGACT GCCCAGAAGA AGTGCCAGGA GGCGATTAAT GCTACTTGCA AAGGCGTGTC 180 0 

CTACTGCACA GGTAATAGCA GTGAGTGCCC GCCTCCAGGA AATGCTGAAG ATGACACTGT 1860 

TTGCTTGGAT CTTGGCAAGT GTAAGGATGG GAAATGCATC CCTTTCTGCG AGAGGGAACA 192 0 

GCAGCTGGAG TCCTGTGCAT GTAATGAAAC TGACAACTCC TGCAAGGTGT GCTGCAGGGA 1980 

CCTTTCCGGC CGCTGTGTGC CCTATGTCGA TGCTGAACAA AAGAACTTAT TTTTGAGGAA 2 040 

AGGAAAGCCC TGTACAGTAG GATTTTGTGA CATGAATGGC AAATGTGAGA AACGAGTACA 2100 

GGATGTAATT GAACGATTTT GGGATTTCAT TGACCAGCTG AGCATCAATA CTTTTGGAAA 2160 

GTTTTTAGCA GACAACATCG TTGGGTCTGT CCTGGTTTTC TCCTTGATAT TTTGGATTCC 2220 

TTTCAGCATT CTTGTCCATT GTGTGTAACG TCGAAATGCT GAGCAGCATG GATTCTGCAT 22 80 

CGGTTCGCAT TATCAAACCC TTTCCTGCGC CCCAGACTCC AGGCCGCCTG CAGCCTGCCC 2340 

CTGTGATCCC TTCGGCGCCA GCAGCTCCAA AACTGGACCA CCAGAGAATG GACACCATCC 2400 

AGGAAGACCC CAGCACAGAC TCACATATGG ACGAGGATGG GTTTGAGAAG GACCCCTTCC 2460 

CAAATAGCAG CACAGCTGCC AAGT CATTTG AGGATCTCAC GGACCATCCG GTCACCAGAA 2520 

GTGAAAAGGC TGCCTCCTTT AAACTGCAGC GTCAGAATCG TGTTGACAGC AAAGAAACAG 25 80 

AGTGCTAATT TAGTTCTCAG CTCTTCTGAC TTAAGTGTGC AAAATATTTT TATAGATTTG 2 640 

ACCTACAATC AATCACAGCT TATATTTTGT GAAGACTGGG AAGTGACTTA GCAGATGCTG 2700 

GTCATGTGTT TGAACTTCCT GCAGGTAAAC AGTTCTTGTG TGGTTTGGCC CTTCTCCTTT 2 760 

TGAAAAGGTA AGGTGAAGGT GAATCTAGCT TATTTTGAGG CTTTCAGGTT TTAGTTTTTA 2 82 0 

AAATATCTTT TGACCTGTGG TGCAAAAGCA GAAAATACAG CTGGATTGGG TTATGAGTAT 2 880 

TTACGTTTTT GTAAATTAAT CTTTTATATT GATAACAGGC ACTGACTAGG GAAATGATCA 2 940 

GTTTTTTTTT ATACACTGTA ATGAACCGCT GAATATGAAG CATTTGGCAT TTATTTGTGA 3000 

GAAAAGTGGA ATAGTTTTTT TTTTTTTTTT TTTTTTTTGC CTTCAACTAA AAACAAAGGA 3060 

GATAAATTTA GTATACATTG TATCTAAATT GTGGGTCTAT TTCTAGTTAT TACCCAGAGT 312 0 

TTTTATGTAG CAGGGAAAAT ATATATCTAA ATTTAGAAAT CATTTGGGTT AATATGGCTC 3180 

TTCATAATTC TAAGACTAAT GCTCAGAACC TAACCACTAC CTTACAGTGA GGG C TAT AC A 3 2 40 

TGGTAG CCAG TTGAATTTAT GGAAT CTACC AACTGTTTAG GGCCCTGATT TGCTGGGCAG 3300 

TTTTTCTGTA TTTTATAAGT ATCTTCATGT ATCCCTGTTA CTGATAGGGA TACATGTCTT 33 60 

AGAAAATTCA CTATTGGCTG GGAGTGGTGG CTCATGCCTG TAATCCCAGC ACTTGGAGAG 3420 
3421 GCTGAGGTTG CGCCACTACA CTCCAGCCTG GGTGACAGAG TGAGATCTGC CTC 
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40 



45 



50 



MRQSLLFLTS 
QTSTHVETLL 
GEPDSRVLAH 
PKVCGYLKVD 
RGEESTTTNY 
AKSYPNEEKD 
HGGVCPKAYY 
AECAPNEDQG 
SRVDEGEECD 
TCKGVSYCTG 
KVCCRDLSGR 
INTFGKFLAD 



11 
I 

WPFVLAPRP 
TFSALKRHFK 
IRDDDVIIRI 
NEELLPKGLV 
LIELIDRVDD 
AWDVKMLLEQ 
SPVGKKNIYL 
GKYVMYP I AV 
PGIMYLNNDT 
NSSECPPPGN 
CVPYVDAEQK 
NIVGSVLVFS 



21 
I 

PDDPGFGPHQ 
LYLTSSTERF 
NTDGAEYNIE 
DREPPEELVH 
I YRNTSWDNA 
FSFDIAEEAS 
NSGLTSTKNY 
SGDHENNKMF 
CCNSDCTLKE 
AEDDTVCLDL 
NLFLRKGKPC 
LIFWIPFSIL 



31 



RLEKLDSLLS 
SQNFKWWD 
PLWRFVNDTK 
RVKRRADPDP 
GFKGYGIQIE 
KVCLiAHLFTY 
GKTILTKEAD 
SNCSKQSIYK 
GVQCSDRNSP 
GKCKDGKC I P 
TVG F CDMNGK 
VHCV 



41 

I 

DYDILSLSNI 
GKNESEYTVK 
DKRMLVYKSE 
MKNTCKIiLW 
QIRILKSPQE 
QDFDMGTLGL 
IiVTTHELGHN 
TIESKAQECF 
CCKNCQFETA 
FCEREQQLES 
CEKRVQDVIE 



51 



QQHSVRKRDL 60 

WQDFFTGHW 120 

DIKNVSRLQS 180 

ADHRFYRYMG 240 

VKPGEKHYNM 3 00 

AYVGS PRANS 3 60 

FGAEHDPDGL 420 

QERSNKVCGN 480 

QKKCQEAINA 540 
CACNETDNSC 600

RFWDFIDQLS 660 
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60 



65 



70 



75 



80 



85 



I 

AGACACCTCT 
GGGCTGCTGC 
CCTGAGAACC 
CACTCGGGTG 
CCAGAAGCAA 
GCGAACCCCA 
CAAGTGGCAC 
GGCGGTGATT 
CACCTTCACT 
GCACGGAGAC 
TGGCCCCGGC 
GGGCGT CGTG 
CATCTTCGAG 
CTGGTGCAGT 
GAGACTCTAC 
CCAAGGCCAA 
CGCCACCACC 
CTCGACGGTG 
GGGTAAGGAG 
TACCACCTCG 
TTTGTTCCTC 
GCCGGAGGCG 
CGACGTGAAT 
AACCACCACC 
TGTCCACCCC 
AGGTCCCCCC 
TGCCTGCAAC 
CAAGGATGGG 



11 

t 

GCCCTCACCA 
TTTGCTGCCC 
AATCTCACCG 
GCAGAGATGC 
CTGTCCCTGC 
CGGTGCGGGG 
CACCACAACA 
GACGACGCCT 
CGCGTGTACA 
GGGTATCCCT 
ATTCAGGGAG 
GTTCCAACTC 
GGCCGCTCCT 
ACCACGGCCA 
ACCCGGGACG 
TCCTACTCCG 
GCCAACTACG 
ATGGGGGGCA 
TACTCGACCT 
AACTTTGACA 
GTGGCGGCGC 
CTCATGTACC 
GGCATCCGGC 
ACACCGCAGC 
TCAGAGCGCC 
ACTGCTGGCC 
GTGAACATCT 
AAGTACTGGC 



21 
I 

TGAGCCTCTG 
CCAGACAGCG 
ACAGGCAGCT 
GTGGAGAGTC 
CCGAGACCGG 
TCCCAGACCT 
TCACCTATTG 
TTGCCCGCGC 
GCCGGGACGC 
TCGACGGGAA 
ACGCCCATTT 
GGTTTGGAAA 
ACTCTGCCTG 
ACTACGACAC 
GCAATGCTGA 
CCTGCACCAC 
ACCGGGACAA 
ACTCGGCGGG 
GTACCAGCGA 
GCGACAAGAA 
ATGAGTT CGG 
CTATGTACCG 
ACCTCTATGG 
CCACGGCTCC 
CCACAGCTGG 
CTTCTACGGC 
TCGACGCCAT 
GATTCTCTGA 



31 



GCAGCCCCTG 
CCAGTCCACC 
GGCAGAGGAA 
GAAATCTCTG 
TGAGCTGGAT 
GGGCAGATTC 
GATCCAAAAC 
CTTCGCACTG 
AGACATCGTC 
GGACGGGCTC 
CGACGATGAC 
CGCAGATGGC 
CACCACCGAC 
CGACGACCGG 
TGGGAAACCC 
GGACGGT CGC 
GCTCTTCGGC 
GGAGCTGTGC 
GGGCCGCGGA 
GTGGGGCTTC 
CCACGCGCTG 
CTTCACTGAG 
TCCTCGCCCT 
CCCGACGGTC 
CCCCACAGGT 
CACTACTGTG 
CGCGGAGATT 
GGGCAGGGGG 



41 

I 

GTCCTGGTGC 
CTTGTGCTCT 
TACCTGTACC 
GGGCCTGCGC 
AGCGCCACGC 
CAAACCTTTG 
TACT CGG AAG 
TGGAGCGCGG 
ATCCAGTTTG 
CTGGCACACG 
GAGTTGTGGT 
GCGGCCTGCC 
GGTCGCTCCG 
TTTGGCTTCT 
TGCCAGTTTC 
TCCGACGGCT 
TTCTGCCCGA 
GTCTTCCCCT 
GATGGGCGCC 
TGCCCGGACC 
GGCTTAGATC 
GGGCCCCCCT 
GAACCTGAGC 
TGCCCCACCG 
CCCCCCTCAG 
CCTTTGAGTC 
GGGAACCAGC 
AGCCGGCCGC 



51 

I 

TCCTGGTGCT 60 

TCCCTGGAGA 120 

GCTATGGTTA 180 

TGCTGCTTCT 240 

TGAAGGCCAT 3 00 

AGGGCGACCT 360 

ACTTGCCGCG 420 

TGACGCCGCT 480 

GTGTCGCGGA 540 

CCTTTCCTCC 600 

CCCTGGGCAA 660 

ACTTCCCCTT 720 

ACGGCTTGCC 780 

GCCCCAGCGA 840 

CATTCATCTT 900 

ACCGCTGGTG 960 

CCCGAGCTGA 1020 

TCACTTTCCT 1080 

TCTGGTGCGC 1140 

AAGGATACAG 1200 

ATTCCTCAGT 1260 

TGCATAAGGA 1320 

CACGGCCTCC 1380 

GACCCCCCAC 1440 

CTGGCCCCAC 1500 

CGGTGGACGA 1560 

TGTATTTGTT 1620 

AGGGCCCCTT 1680 



397 



WO 02/086443 

CCTTATCGCC GACAAGTGGC CCGCGCTGCC CCGCAAGCTG GACTCGGTCT TTGAGGAGCC 1740 

GCTCTCCAAG AAGCTTTTCT TCTTCTCTGG GCGCCAGGTG TGGGTGTACA CAGGCGCGTC 180 0 

GGTGCTGGGC CCGAGGCGTC TGGACAAGCT GGGCCTGGGA GCCGACGTGG CCCAGGTGAC 18 60 

CGGGGCCCTC CGGAGTGGCA GGGGGAAGAT GCTGCTGTTC AGCGGGCGGC GCCTCTGGAG 192 0 

GTTCGACGTG AAGGCGCAGA TGGTGGATCC CCGGAGCGCC AGCGAGGTGG ACCGGATGTT 1980 

CCCCGGGGTG CCTTTGGACA CGCACGACGT CTTCCAGTAC CGAGAGAAAG CCTATTTCTG 2040 

CCAGGACCGC TTCTACTGGC GCGTGAGTTC CCGGAGTGAG TTGAACCAGG TGGACCAAGT 2100 

GGGCTACGTG ACCTATGACA TCCTGCAGTG CCCTGAGGAC TAGGGCTCCC GTCCTGCTTT 2160 

GCAGTGCCAT GTAAATCCCC ACTGGGACCA ACCCTGGGGA AGGAGCCAGT TTGCCGGATA 2220 

CAAACTGGTA TTCTGTTCTG GAGGAAAGGG AGGAGTGGAG GTGGGCTGGG CCCTCTCTTC 2280 
TCACCTTTGT TTTTTGTTGG AGTGTTTCTA ATAAACTTGG ATTCTCTAAC CTTT 

Seq ID NO: 559 Protein sequence 
Protein Accession #: NP_004985.1 

1 11 21 31 41 51 

I I ! I I ! 

MSLWQPLVLV LLVLGCCFAA PRQRQSTLVL FPGDLRTNLT DRQLAEEYLY RYGYTRVAEM 60 

RGESKSLGPA LLLLQKQLSL PETGELDSAT LKAMRTPRCG VPDLGRFQTF EGDLKWHHHN 120 

ITYWIQNYSE DLPRAVIDDA FARAFALWSA VTPLTFTRVY SRDADIVIQF GVAEHGDGYP 180 

FDGKDGLLAH AFPPGPGIQG D AH FDDDELW SLGKGVWPT RFGNADGAAC HFPFIFEGRS 2 40 

YSACTTDGRS DGLPWCSTTA NYDTDDRFGF CPSERLYTRD GNADGKPCQF PFIFQGQSYS 3 00 

ACTTDGRSDG YRWCATTANY DRDKLFGFCP TRAD S TVMGG NSAGELCVFP FTFLGKEYST 3 60 

CTSEGRGDGR LWCATTSNFD SDKKWGFCPD QGYSLFLVAA HEFGHALGLD HSSVPEALMY 42 0 

PMYRFTEGPP LHKDDVNGIR HLYGPRPEPE PRPPTTTTPQ PTAPPTVCPT GPPTVHPSER 480 

PTAGPTGPPS AGPTGPPTAG PSTATTVPLS PVDDACNVNI FDAIAEIGNQ LYLFKDGKYW 540 

RFSEGRGSRP QGPFLIADKW PALPRKLDSV FEEPLSKKLF FFSGRQVWVY TGASVLGPRR 60 0 

LDKLGLGADV AQVTGALRSG RGKMLIiFSGR RLWRFDVKAQ MVDPRSASEV DRMFPGVPLD 660 
THDVFQYREK AYFCQDRFYW RVSSRSELNQ VDQVGYVTYD ILQCPED 

Seq ID NO: 560 DNA sequence 

Nucleic Acid Accession #: NM_000213.1 

Coding sequence: 127.. 5385 

1 11 21 31 41 51 

111)11 

CGCGCGCGCG CTGCAGCCCC ATCTCCTAGC GGCAGCCCAG GCGCGGAGGG AGCGAGTCCG 60 

CCCCGAGGTA GGTCCAGGAC GGGCGCACAG CAGCAGCCGA GGCTGGCCGG GAGAGGGAGG 12 0 

AAGAGGATGG CAGGGCCACG CCCCAGCCCA TGGGCCAGGC TGCTCCTGGC AGCCTTGATC 180 

AGCGTCAGCC TCTCTGGGAC CTTGGCAAAC CGCTGCAAGA AGGCCCCAGT GAAGAGCTGC 240 

ACGGAGTGTG TCCGTGTGGA TAAGGACTGC GCCTACTGCA CAGACGAGAT GTT CAGGGAC 3 00 

CGGCGCTGCA ACACCCAGGC GGAGCTGCTG GCCGCGGGCT GCCAGCGGGA GAGCATCGTG 3 60 

GTCATGGAGA GCAGCTTCCA AATCACAGAG GAGACCCAGA TTGACACCAC CCTGCGGCGC 420 

AGCCAGATGT CCCCCCAAGG CCTGCGGGTC CGTCTGCGGC CCGGTGAGGA GCGGCATTTT 480 

GAGCTGGAGG TGTTTGAGCC ACTGGAGAGC CCCGTGGACC TGTACATCCT CATGGACTTC 540 

TCCAACTCCA TGTCCGATGA TCTGGACAAC CTCAAGAAGA TGGGG CAGAA CCTGGCTCGG 600 

GTCCTGAGCC AGCTCACCAG CGACTACACT ATTGGATTTG GCAAGTTTGT GGACAAAGTC 660 

AGCGTCCCGC AGACGGACAT GAGGCCTGAG AAGCTGAAGG AGCCCTGGCC CAACAGTGAC 720 

CCCCCCTTCT CCTTCAAGAA CGT CATC AGC CTGACAGAAG ATGTGGATGA GTTCCGGAAT 780 

AAACTGCAGG GAGAGCGGAT CTCAGGCAAC CTGGATGCTC CTGAGGGCGG CTTCGATGCC 840 

ATCCTGCAGA CAGCTGTGTG CACGAGGGAC ATTGGCTGGC GCCCGGACAG CACCCACCTG 900 

CTGGTCTTCT CCACCGAGTC AGCCTTCCAC TATGAGGCTG ATGGCGCCAA CGTGCTGGCT 960 

GGCAT CATGA GCCGCAACGA TGAACGGTGC CACCTGGACA CCACGGGCAC CTACACCCAG 102 0 

TACAGGACAC AGGACTACCC GTCGGTGCCC ACCCTGGTGC GCCTGCTCGC CAAGCACAAC 1080 

ATCATCCCCA TCTTTGCTGT CACCAACTAC TCCTATAGCT ACTACGAGAA GCTTCACACC 1140 

T AT TTCCCTG TCTCCTCACT GGGGGTGCTG CAGGAGGACT CGTCCAACAT CGTGGAGCTG 12 00 

CTGGAGGAGG CCTTCAATCG GATCCGCTCC AACCTGGACA TCCGGGCCCT AGACAGCCCC 12 60 

CGAGGCCTTC GGACAGAGGT CACCTCCAAG ATGTTCCAGA AGACGAGGAC TGGGTCCTTT 132 0 

CACATCCGGC GGGGGGAAGT GGGTATATAC CAGGTGCAGC TGCGGGCCCT TGAGCACGTG 13 80 

GATGGGACGC ACGTGTGCCA GCTGCCGGAG GACCAGAAGG GCAACATCCA TCTGAAACCT 1440 

TCCTTCTCCG ACGGCCTCAA GATGGACGCG GGCATCATCT GTGATGTGTG CACCTGCGAG 1500 

CTGCAAAAAG AGGTGCGGTC AGCTCGCTGC AGCTTCAACG GAGACTTCGT GTGCGGACAG 1560 

TGTGTGTGCA GCGAGGGCTG GAGTGGCCAG ACCTGCAACT GCTCCACCGG CTCTCTGAGT 162 0 

GACATTCAGC CCTGCCTGCG GGAGGGCGAG GACAAGCCGT GCTCCGGCCG TGGGGAGTGC 1680 

CAGTGCGGGC ACTGTGTGTG CTACGGCGAA GGCCGCTACG AGGGTCAGTT CTGCGAGTAT 1740 

GACAACTTCC AGTGTCCCCG CACTTCCGGG TTCCTCTGCA ATGACCGAGG ACGCTGCTCC 180 0 

ATGGGCCAGT GTGTGTGTGA GCCTGGTTGG ACAGGCCCAA GCTGTGACTG TCCCCTCAGC 1860 

AATGCCACCT GCATCGACAG CAATGGGGGC ATCTGTAATG GACGTGGCCA CTGTGAGTGT 192 0 

GGCCGCTGCC ACTGCCACCA GCAGTCGCTC TACACGGACA CCATCTGCGA GAT CAACTAC 1980 

TCGGCGATCC ACCCGGGCCT CTG CGAGGAC CTACGCTCCT GCGTGCAGTG CCAGGCGTGG 2 040 

GGCACCGGCG AGAAGAAGGG GCGCACGTGT GAGGAATGCA ACTTCAAGGT CAAGATGGTG 2100

GACGAGCTTA AGAGAGCCGA GGAGGTGGTG GTGCGCTGCT CCTTCCGGGA CGAGGATGAC 2160 

GACTGCACCT ACAGCTACAC CATGGAAGGT GACGGCGCCC CTGGGCCCAA CAGCACTGTC 222 0 

CTGGTGCACA AGAAGAAGGA CTGCCCTCCG GGCTCCTTCT GGTGGCTCAT CCCCCTGCTC 2280 

CTCCTCCTCC TGCCGCTCCT GGCCCTGCTA CTGCTGCTAT GCTGGAAGTA CTGTGCCTGC 2340 

TGCAAGGCCT GCCTGGCACT TCTCCCGTGC TGCAACCGAG GT CACATGGT GGGCTTTAAG 2400 

GAAGACCACT ACATGCTGCG GGAGAACCTG ATGGCCTCTG ACCACTTGGA CACGCCCATG 2460 

CTGCGCAGCG GGAACCTCAA GGGCCGTGAC GTGGTCCGCT GGAAGGTCAC CAACAACATG 252 0 

CAGCGGCCTG GCTTTGCCAC TCATGCCGCC AGCATCAACC CCACAGAGCT GGTGCCCTAC 2580 

GGGCTGTCCT TGCGCCTGGC CCGCCTTTGC ACCGAGAACC TGCTGAAGCC TGACACTCGG 2 640 

GAGTGCGCCC AGCTGCGCCA GGAGGTGGAG GAGAACCTGA ACGAGGTCTA CAGGCAGATC 2700 

TCCGGTGTAC ACAAGCTCCA GCAGACCAAG TTCCGGCAGC AGCCCAATGC CGGGAAAAAG 2760 

CAAGACCACA CCATTGTGGA CACAGTGCTG ATGGCGCCCC GCTCGGCCAA GCCGGCCCTG 282 0 

CTGAAGCTTA CAGAGAAGCA GGTGGAACAG AGGGCCTTCC ACGACCTCAA GGTGGCCCCC 2880 

GGCTACTACA CCCTCACTGC AGACGAGGAC GCCCGGGGCA TGGTGGAGTT CCAGGAGGGC 2 940 

GTGGAGCTGG TGGACGTACG GGTGCCCCTC TTTATCCGGC CTGAGGATGA CGACGAGAAG 3000 

CAGCTGCTGG TGGAGGCCAT CGACGTGCCC GCAGGCACTG CCACCCTCGG CCGCCGCCTG 3 060 
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GTAAACATCA CCATCATCAA GGAGCAAGCC AGAGACGTGG TGTCCTTTGA GCAGCCTGAG 3120 

TTCTCGGTCA GCCGCGGGGA CCAGGTGGCC CGCATCCCTG TCATCCGGCG TGTCCTGGAC 3180 

GGCGGGAAGT CCCAGGTCTC CTACCGCACA CAGGATGGCA CCGCGCAGGG CAACCGGGAC 3240 

TACATCCCCG TGGAGGGTGA GCTGCTGTTC CAGCCTGGGG AGGCCTGGAA AGAGCTGCAG 3300 

GTGAAGCTCC TGGAGCTGCA AGAAGTTGAC TCCCTCCTGC GGGGCCGCCA GGTCCGCCGT 3360 

TTCCACGTCC AGCTCAGCAA CCCTAAGTTT GGGGCCCACC TGGGCCAGCC CCACTCCACC 3420 

ACCATCATCA TCAGGGACCC AGATGAACTG GACCGGAGCT TCACGAGTCA GATGTTGTCA 3480 

TCACAGCCAC CCCCTCACGG CGACCTGGGC GCCCCGCAGA ACCCCAATGC TAAGGCCGCT 3540 

GGGTCCAGGA AGATCCATTT CAACTGGCTG CCCCCTTCTG GCAAGCCAAT GGGGTACAGG 3 600 

GTAAAGTACT GGATTCAGGG TGACTCCGAA TCCGAAGCCC ACCTGCTCGA CAGCAAGGTG 3660 

CCCTCAGTGG AGCTCACCAA CCTGTACCCG TATTGCGACT ATGAGATGAA GGTGTGCGCC 3720 

TACGGGGCTC AGGGCGAGGG ACCCTACAGC TCCCTGGTGT CCTGCCGCAC CCACCAGGAA 3780 

GTGCCCAGCG AGCCAGGGCG TCTGGCCTTC AATGT CGTCT CCTCCACGGT GACCCAGCTG 3840 

AGCTGGGCTG AGCCGGCTGA GACCAACGGT GAGATCACAG CCTACGAGGT CTGCTATGGC 3900 

CTGGTCAACG ATGACAACCG ACCTATTGGG CCCATGAAGA AAGTGCTGGT TGACAACCCT 3960 

AAGAACCGGA TGCTGCTTAT TGAGAACCTT CGGGAGTCCC AGCCCTACCG CTACACGGTG 402 0 

AAGGCGCGCA ACGGGGCCGG CTGGGGGCCT GAGCGGGAGG CCATCATCAA CCTGGCCACC 4080 

CAGCCCAAGA GGCCCATGTC CATCCCCATC ATCCCTGACA TCCCTATCGT GGACGCCCAG 4140 

AGCGGGGAGG ACTACGACAG CTTCCTTATG TACAGCGATG ACGTTCTACG CTCTCCATCG 4200 

GGCAGCCAGA GGCCCAGCGT CTCCGATGAC ACTGAGCACC TGGTGAATGG CCGGATGGAC 42 60 

TTTGCCTTCC CGGGCAGCAC CAACTCCCTG CACAGGATGA CCACGACCAG TGCTGCTGCC 432 0 

TATGGCACCC ACCTGAGCCC ACACGTGCCC CACCGCGTGC TAAG CACATC CTCCACCCTC 43 80 

ACACGGGACT ACAACTCACT GACCCGCTCA GAACACTCAC ACTCGACCAC ACTGCCGAGG 4440 

GACTACTCCA CCCTCACCTC CGTCTCCTCC CACGACTCTC GCCTGACTGC TGGTGTGCCC 4500 

GACACGCCCA CCCGCCTGGT GTTCTCTGCC CTGGGGCCCA CATCTCTCAG AGTGAGCTGG 4560 

CAGGAGCCGC GGTGCGAGCG GCCGCTGCAG GGCTACAGTG TGGAGTACCA GCTGCTGAAC 462 0 

GGCGGTGAGC TGCATCGGCT CAACATCCCC AACCCTGCCC AGACCTCGGT GGTGGTGGAA 4680 

GACCTCCTGC CCAACCACTC CTACGTGTTC CGCGTGCGGG CCCAGAGCCA GGAAGGCTGG 4740 

GGCCGAGAGC GTGAGGGTGT CATCACCATT GAAT CCCAGG TGCACCCGCA GAGCCCACTG 4800 

TGTCCCCTGC CAGGCTCCGC CTTCACTTTG AGCACTCCCA GTGCCCCAGG CCCGCTGGTG 4860 

TTCACTGCCC TGAGCCCAGA CTCGCTGCAG CTGAGCTGGG AGCGGCCACG GAGGCCCAAT 4 92 0 

GGGGATATCG TCGGCTACCT GGTGACCTGT GAGATGGCCC AAGGAGGAGG GCCAGCCACC 4980 

GCATTCCGGG TGGATGGAGA CAGCCCCGAG AGCCGGCTGA CCGTGCCGGG CCTCAGCGAG 5040 

AACGTGCCCT ACAAGTT CAA GGTGCAGGCC AGGACCACTG AGGGCTTCGG GCCAGAGCGC 5100 

GAGGGCATCA TCACCATAGA GTCCCAGGAT GGAGGACCCT TCCCGCAGCT GGGCAGCCGT 5160 

GCCGGGCTCT TCCAGCACCC GCTGCAAAGC GAGTACAGCA GCATCACCAC CACCCACACC 5220 

AGCGCCACCG AGCCCTTCCT AGTGGATGGG CCGACCCTGG GGGCCCAGCA CCTGGAGGCA 5280 

GGCGGCTCCC TCACCCGGCA TGTGACCCAG GAGTTTGTGA GCCGGACACT GACCACCAGC 5340 

GGAACCCTTA GCACCCACAT GGACCAACAG TTCTTCCAAA CTTGACCGCA CCCTGCCCCA 5400 

CCCCCGCCAT GTCCCACTAG GCGTCCTCCC GACTCCTCTC CCGGAGCCTC CTCAGCTACT 5460 

CCATCCTTGC ACCCCTGGGG GCCCAGCCCA CCCGCATGCA CAGAGCAGGG GCTAGGTGTC 552 0 

TCCTGGGAGG CATGAAGGGG GCAAGGTCCG TCCTCTGTGG GCCCAAACCT ATTTGTAACC 5580 

AAAGAGCTGG GAGCAGCACA AGGACCCAGC CTTTGTTCTG CACTTAATAA ATGGTTTTGC 5640 
TACTG 

Seq ID NO: 561 Protein sequence 
Protein Accession #: NP_000204.1 

1 11 21 31 41 51 

| | | | | | 

MAGPRPSPWA RLLLAALISV SLSGTLANRC KKAPVKSCTE CVRVDKDCAY CTDEMFRDRR 60 

CNTQAELLAA GCQRESIWM ESSFQITEET QIDTTLRRSQ MSPQGLRVRL RPGEERHFEIj 120 

EVFEPLESPV DLYILMDFSN SMSDDLDNLK KMGQNLARVL SQLTSDYTIG FGKFVDKVSV 180' 

PQTDMRPEKL KEPWPNSDPP FSFKNVISLT EDVDEFRNKL QGERISGNLD APEGGFDAIL 240 

QTAVCTRDIG WRPDSTHLLV FSTESAFHYE ADGANVLAGI MSRNDERCHL DTTGTYTQYR 300 

TQDYPSVPTL VRLLAKHNI I PIFAVTNYSY SYYEKLHTYF PVSSLGVLQE DSSNIVELLE 3 60 

EAFNRIRSNL DIRALDSPRG LRTEVTSKMF QKTRTGSFHI RRGEVGIYQV QLRALEHVDG 420 

THVCQLPEDQ KGNIHLKPSF SDGLKMDAGI ICDVCTCELQ KE VRS ARCS F NGDFVCGQCV 48 0 

CSEGWSGQTC NCSTGSLSDI QPCLREGEDK PCSGRGECQC GHCVCYGEGR YEGQFCEYDN 540 

FQCPRTSGFL CNDRGRCSMG QCVCEPGWTG PSCDCPLSNA TCIDSNGGIC NGRGHCECGR 60 0 

CHCHQQSLYT DTICEINYSA IHPGLCEDLR SCVQCQAWGT GEKKGRTCEE CNFKVKMVDE 660 

LKRAEEVWR CSFRDEDDDC TYSYTMEGDG APGPNSTVLV HKKKDCPPGS FWWLIPLLLL 72 0 

LLPLLALLLL LCWKYCACCK ACLALLPCCN RGHMVGFKED HYMLRENLMA SDHLDTPMLR 780 

SGNLKGRDW RWKVTNNMQR PGFATHAASI NPTELVPYGL SLRLARLCTE NLLKPDTREC 840 

AQLRQEVEEN LNEVYRQISG VHKLQQTKFR QQPNAGKKQD HTIVDTVLMA PRSAKPALLK 900 

LTEKQVEQRA FHDLKVAPGY YTLTADQDAR GMVEFQEGVE LVDVRVPLFI RPEDDDEKQL 960 

LV EA I D VP AG TATLGRRLVN ITIIKEQARD WSFEQPEFS VSRGDQVARI PVIRRVLDGG 102 0 

KSQVSYRTQD GTAQGNRDY I PVEGELLFQP GEAWKELQVK LLELQEVDSL LRGRQVRRFH 10 80 

VQLSNPKFGA HLGQPHSTTI IIRDPDELDR SFTSQMLSSQ PPPHGDLGAP QNPNAKAAGS 1140 

RKIHFNWLPP SGKPMGYRVK YWIQGDSESE AHLLDSKVPS VELTNLYPYC DYEMKVCAYG 12 00 

AQGEGPYSSL VSCRTHQEVP SEPGRLAFNV VSSTVTQLSW AEPAETNGEI TAYEVCYGLV 12 60 

NDDNRPIGPM KKVLVDNPKN RMLL1ENLRE SQPYRYTVKA RNGAGWGPER EAIINLATQP 1320 

KRPMSIPIIP DIPIVDAQSG EDYDSFLMYS DDVLRSPSGS QRPSVSDDTE HLVNGRMDFA 13 80 

FPGSTNSLHR MTTTSAAAYG THLSPHVPHR VLSTSSTI/TR DYNSLTRSEH SHSTTLPRDY 1440 

STLTSVSSHD SRLTAGVPDT PTRLVFSALG PTSLRVSWQE PRCERPLQGY SVEYQLLNGG 1500 

ELHRLNIPNP AQTSVWEDL LPNHSYVFRV RAQSQEGWGR EREGVITIES QVHPQSPLCP 15 60 

LPGSAFTLST PSAPGPLVFT ALSPDSLQLS WERPRRPNGD IVGYLVTCEM AQGGGPATAF 1620 

RVDGDSPESR LTVPGLSENV PYKFKVQART TEGFGPEREG IITIESQDGG PFPQLGSRAG 1680 

LFQHPLQSEY SSI TTTHTS A TEPFLVDGPT LGAQHLEAGG SLTRHVTQEF VSRTLTTSGT 1740 
LSTHMDQQFF QT 

Seq ID NO: 562 DNA sequence 

Nucleic Acid Accession #: NM_013332.1 

Coding sequence: 1..63 

1 11 21 31 41 51 



399 



10 



15 



20 



25 



WO 02/086443 

GCACGAGGGC GCTTTTGTCT 
AGTAACCGAC TTTCCTCCGG 
CGGCTGTTCC CCCGGAGGGT 
GCAGAGGAGT AGGGTCCTTT 
GGTACTGACC CTACTCTCCA 
GAGCCCATCG CCTGGGACCT 
CAAGGGCCTT CCAGACCATC 
ATATTTTGGA ACACTGACCT 
TGAGCACCGT TGTAACCAGA 
CTCATTGCCT GGGCAAGGCC 
CACTTTGGGA GGCTGAGGTG 
CAACATGGCG AAACCCCATC 
GGCCTGTAAT CCCAGTTCCT 
GAGGTTGCAG TGAACCGAGA 
CATCTCAAAA AAAAAAAGAA 
TTATGGCTAT GAGATAGGTT 
TCCTCAGCAG TATGGCTCTG 
TGATATTTTC AACCCTACTT 
TATGCTCAAT TATTTGGTGT 
CAGTTGAAGA GGTTGTGTGG 
TTCTCATTTT ACATTTTAAA 
GGTGGGATGC CAAAGCCTGC 
TTTTTTCTAA CTAATAAAGT 



PCT/US02/12476 



CCGGTGAGTT 
ACTCCTGCAC 
CCAGAGGCCT 
CAGCCATGAA 
TCTTCGTTAG 
CCTGGACCAC 
CATCCAGAAG 
AGACATGTCC 
GAACTATTAC 
TGTTTAGGCC 
GGTGGAT C AC 
TCTACTAAAA 
TGGGAGGCTG 
TCGCACTGCT 
AAGAAAAAGC 
GATCTCGCCC 
ACATCT CTT A 
CCTAAACATC 
TGAGCCTCTC 
GTGGGCTGTT 
GTCGTTCCTC 
TCAAGTTATG 
GGAATATATA 



TTGTGGCGGG 
GACCTGCTCC 
TTCAGAAGGA 
GCATGTGTTG 
AGTGATGGAG 
CAGAAGCCAA 
CATGTGATAA 
AGATGGGAGT 
TAGGCCTTGA 
GGTTGCGGTG 
CTGAGGTCAG 
ATACAAAAGT 
AGGCGGGAGA 
GTACCCAGCC 
CTGTTTAATG 
TTACCCCGGG 
GATGTCCCAA 
TGTCTGGGGT 
TTCCACAAGA 
GGGAGTGAGG 
CAACATAGTG 
GACATTGTGG 
TTTCAAAAAA 



AAGCTTCTGC 
TACAGCCGGC 
GAAGGCAGCT 
AACCTCTACC 
TCCCTAGAAG 
CTAGCCAACA 
GACCTCCTTC 
CCCATTCCTA 
AGAACCTGTC 
GCTCATGCCT 
GAGTTCGAGA 
TAGCTGGGTG 
ATTGCTTGAA 
TGGGCCACAG 
CACAGGTGTG 
GTCTGGTGTA 
CTTCAGCTGT 
TCCTTTAGTC 
GCTCCTCCAT 
ATGGAGTGTT 
TGTATTGGTC 
CCACCATGTG 
AAAAAAAAAA 



GCTGGTGCTT 60 

GATCCACTCC 120 

CTGTTTCTCT 180 

TGTTAGGTGT 240 

GCTTACTAGA 300 

CAGAGCCCAC 3 60 

CATACTGGCC 420 

GCAGACAAGC 480 

TAACTGGATG 540 

GTAATCCTAG 600 

CCAGCCTCGC 660 

TGGTGGCAGA 720 

CCCGGGGACG 780 

TGCAAGACTC 840 

AGTGGATTGC 90 0 

TGCTGTGCTT 960 

TGGGAGATGG 102 0 

TTGAATGTCT 1080 

GTTTGGATAG 1140 

CAGTGCCCAT 1200 

TGAAGGGGGT 12 60 

GCTTAAATGA 132 0 
AA 



Seq ID NO: 563 Protein sequence 
Protein Accession #: NP_037464.1 



1 11 21 31 41 51 

| | | | | | 

JU MKHVLNLYLL GWLTLLSIF VRVMESLEGL LESPSPGTSW TTR SQL ANTE PTKGLPDHPS 

RSM 



60 



35 



Seq ID NO: 564 DNA sequence 

Nucleic Acid Accession #: NM_023915.1 

Coding sequence: 250..1326 



40 



45 



50 



55 



60 



GGCACGAGGG 
TCAAAGCTTA 
GTGAATGGAC 
CCCACGCCTC 
AACTGAAGAA 
CAAGAGAGTC 
AATGAATTTG 
TTGCTGAATG 
TTCTATCTCA 
ATAGTCCATG 
TCAGTTTTGT 
GAT CGCTAT C 
ACGAAGGTTT 
ATCCTGACAA 
CCTTTGGGGG 
GTGCTGGTGA 
AGGCAATTCA 
GTGGCTGTGT 
AGTCACTTAG 
ATTACACTTT 
TGTAGGTCAT 
ATCAGATCAC 
GTGTAGGCCT 
TTCATTATCC 



11 

I 

TTTCGTTTTC 
TTCTTAATTA 
AGCCAGCCAC 
AATCGTCCCC 
TGGGGTTCAA 
ACAATTCAGG 
ACACAATTGT 
GTTTAG CAGT 
AAAACATAGT 
ATGCAGGATT 
TTTATGCAAA 
TGAAGGTGGT 
TATCTGTTTG 
ATGGTCAGCC 
TCAAATGGCA 
TTCTGATCGG 
TAAGTCAGTC 
TTTTTACCTG 
ACAGGCTTTT 
TCTTGTCTGC 
TTTCAAGAAG 
TGCAAAGTGT 
TTTATTGTTT 
TTAAAAAAAA 



21 
I 

ATGCTTTACC 
GAGACAAGAA 
CACAATGAAA 
AAGTGTTTCC 
CTTGACGCTT 
CAACAGGAGC 
CTTGCCGGTG 
GTGGATCTTC 
GGTTGCAGAC 
TGGACCTTGG 
CATGTATACT 
CAAGCCATTT 
TGTTTGGGTG 
AACAGAGGAC 
TACGGCAGTC 
ATGTTACATA 
AAGCCGAAAG 
CTTTCTACCA 
AGATGAATCT 
GTGTAATGTT 
GCTGTTCAAA 
GAGAAGATCG 
GTTGGAATCG 
AA 



31 

I 

AGAAAATCCA 
ACCTGTTTCA 
GAAATCAAAC 
TGACACGCAT 
GCAAAATTAC 
GACGGGCCAG 
CTTTATCTCA 
TTCCACATTA 
CT CAT AATGA 
TACTTCAAGT 
TCCATCGTGT 
GGGGACTCTC 
AT CATGGCTG 
AATATCCATG 
ACCTATGTGA 
GCCATATCCA 
CGAAAACATA 
TATCACTTGT 
GCACAAAAAA 
TGCCTGGATC 
AAATCAAATA 
GAAGTTCGCA 
ATATGTACAA 



41 
I 

CTTCCCTGCC 
ACTTGAAGAC 
CAGGAATAAC 
CTTTGCTTAC 
CAAATAACGA 
GAAAGAACAC 
TTATATTTGT 
GGAATAAAAC 
CGCTGACATT 
TTATTCTCTG 
TCCTTGGGCT 
GGATGTACAG 
TTTTGTCTTT 
ACTGCTCAAA 
ACAGCTGCTT 
GGTACATCCA 
ACCAGAGCAT 
GCAGAATTCC 
TCCTATATTA 
CAATAATTTA 
T CAG AACCAG 
TATATTATGA 
AGTGTAAATA 



51 
I 

GACCT TAGTT 60 

ACCGTATGAG 120 

CTATGCTGAA 180 

AGTGCAT C AC 240 

GCTGCACGGC 3 00 

CACCCTTCAC 3 60 

GGCAAGCATC 420 

CAGCTTCATA 480 

TCCATTTCGA 540 

CAGATACACT 600 

GATAAGCATT 660 

CATAACCTTC 720 

GCCAAACATC 780 

ACTTAAAAGT 840 

GTTTGTGGCC 900 

CAAATCCAGC 960 

CAGGGTTGTT 102 0 

TTTTACTTTT 1080 

CTGCAAAGAA 1140 

CTTTTTCATG 12 00 

GAGTGAAAGC 12 60 

TTACACTGAT 1320 

AATGTTTCTT 13 80 



Seq ID NO: 565 Protein sequence 
65 Protein Accession #: NP_076404 



70 



75 



80 



85 



MGFNLTLAKL 
GLAVWIFFHI 
FYANMYTSIV 
NGQPTEDNIH 
ISQSSRKRKH 
FLSACNVCLD 



11 
I 

PNNELHGQES 
RNKTSFIFYL 
FLGLISIDRY 
DCSKLKSPLG 
NQSIRVWAV 
PIIYFFMCRS 



21 



HNSGNRSDGP 
KNIWADLIM 
LKWKPFGDS 
VKWHTAVTYV 
FFTCFLPYHL 
FSRRLFKKSN 



31 
I 

GKNTTLHNEF 
TLTFPFRIVH 
RMYSITFTKV 
NSCLFVAVLV 
CRIPFTFSHL 
IRTRSESIRS 



41 
I 

DTIVLPVLYL 
DAGFGPWYFK 
LSVCVWVIMA 
ILIGCYIAIS 
DRLLDESAQK 
LQSVRRSEVR 



51 



IIFVASILLN 
FILCRYTSVL 
VLSLPNIILT 
RYIHKSSRQF 
ILYYCKEITL 
IYYDYTDV 



Seq ID NO: 566 DNA sequence 

Nucleic Acid Accession #: NM_005365.1 

Coding sequence: 1..948 



ATGTCTCTCG 
GAGGACTTGG 
TCCTCTGACA 
CCTCAGGGAG 
GAGGGCTCCA 
GAGTTCATGT 



11 

i 

AGCAGAGGAG 
GCCTGATGGG 
GCAAGGAGGA 
GCGCTTCCTC 
GCAGTCAAGA 
TCCAAGAAGC 



21 
I 

TCCGCACTGC 
TGCACAGGAA 
GGAGGTGT CT 
CTCCATTTCC 
AGAGGAAGAG 
ACTGAAATTG 



31 
I 

AAGCCTGATG 
CCCACAGGCG 
GCTGCTGGGT 
GTCTACTACA 
CCAAGCTCCT 
AAGGTGGCTG 



41 



51 



AAGACCTTGA 
AGGAGGAGGA 
CATCAAGTCC 
CTTTATGGAG 
CGGTCGACCC 
AGTTGGTTCA 



AGCCCAAGGA 
GACTACCTCC 
TCCCCAGAGT 
CCAATTCGAT 
AGCTCAGCTG 
TTTCCTGCTC 



60 
120 
180 
240 
300 



60 
120 
180 
240 
300 
360 



400 



WO 02/086443 

CACAAATATC GAGTCAAGGA GCCGGTCACA AAGGCAGAAA TGCTGGAGAG CGTCATCAAA 
AATTACAAGC GCTACTTTCC TGTGATCTTC GGCAAAGCCT CCGAGTTCAT GCAGGTGATC 
TTTGGCACTG ATGTGAAGGA GGTGGACCCC GCCGGCCACT CCTACATCCT TGTCACTGCT 
CTTGGCCTCT CGTGCGATAG CATGCTGGGT GATGGTCATA GCATGCCCAA GGCCGCCCTC 
CTGATCATTG TCCTGGGTGT GAT CCTAACC AAAGACAACT GCGCCCCTGA AGAGGTTATC 
TGGGAAGCGT TGAGTGTGAT GGGGGTGTAT GTTGGGAAGG AGCACATGTT CTACGGGGAG 
CCCAGGAAGC TGCTCACCCA AGATTGGGTG CAGGAAAACT ACCTGGAGTA CCGGCAGGTG 
CCCGGCAGTG ATCCTGCGCA CTACGAGTTC CTGTGGGGTT CCAAGGCCCA CGCTGAAACC 
AGCTATGAGA AGGTCATAAA TTATTTGGTC ATGCTCAATG CAAGAGAGCC CATCTGCTAC 
CCATCCCTTT ATGAAGAGGT TTTGGGAGAG GAGCAAGAGG GAGTCTGA 

Seq ID NO: 567 Protein sequence 
Protein Accession #: NP_005356.1 

1 11 21 31 41 51 

I i I I I I 

MSLEQRSPHC KPDEDLEAQG EDLGLMGAQE PTGEEEETTS SSDSKEEEVS AAGSSSPPQS 

PQGGASSSIS VYYTLWSQFD EGSSSQEEEE PSSSVDPAQL EFMFQEALKL KVAELVHFLL 

HKYRVKEPVT KAEMLESVIK NYKRYFPVIF GKASEFMQVI FGTDVKEVDP AGHSYILVTA 

LGLSCDSMLG DGHSMPKAAL LIIVLGVILT KDNCAPEEVI WEALSVMGVY VGKEHMFYGE 

PRKLLTQDWV QENYLEYRQV PGSDPAHYEF LWGSKAHAET SYEKVINYLV MLNAREPICY 

PSLYEEVLGE EQEGV 

Seq ID NO: 568 DNA sequence 
Nucleic Acid Accession #: NM_014400 
Coding sequence: 86..1126 

1 11 21 31 41 51 

I I I I l l 

GGTTACTCAT CCTGGGCTCA GGTAAGAGGG CCCGAGCTCG GAGGCGGCAC ACCCAGGGGG 

GACGCCAAGG GAGCAGGACG GAGCCATGGA CCCCGCCAGG AAAGCAGGTG CCCAGGCCAT 

GATCTGGACT GCAGGCTGGC TGCTGCTGCT GCTGCTTCGC GGAGGAGCGC AGGCCCTGGA 

GTGCTACAGC TGCGTGCAGA AAGCAGATGA CGGATGCTCC CCGAACAAGA TGAAGACAGT 

GAAGTGCGCG CCGGGCGTGG ACGTCTGCAC CGAGGCCGTG GGGGCGGTGG AGACCATCCA 

CGGACAATTC TCGCTGGCAG TGCSGGGTTG CGGTTCGGGA CTCCCCGGCA AGAATGACCG 

CGGCCTGGAT CTTCACGGGC TTCTGGCGTT CATCCAGCTG CAGCAATGCG CTCAGGATCG 

CTGCAACGCC AAGCTCAACC TCACCTCGCG GGCGCTCGAC CCGGCAGGTA ATGAGAGTGC 

ATACCCGCCC AACGGCGTGG AGTGCTACAG CTGTGTGGGC CTGAGCCGGG AGGCGTGCCA 

GGGTACATCG CCGCCGGTCG TGAGCTGCTA CAACGCCAGC GATCATGTCT ACAAGGGCTG 

CTTCGACGGC AACGT CACCT TGACGGCAGC TAATGTGACT GTGTCCTTGC CTGTCCGGGG 

CTGTGTCCAG GATGAATTCT GCACTCGGGA TGGAGTAACA GGCCCAGGGT TCACGCTCAG 

TGGCTCCTGT TGCCAGGGGT CCCGCTGTAA CTCTGACCTC CGCAACAAGA CCTACTTCTC 

CCCTCGAATC CCACCCCTTG TCCGGCTGCC CCCTCCAGAG CCCACGACTG TGGCCTCAAC 

CACATCTGTC ACCACTTCTA CCTCGGCCCC AGTGAGACCC ACATCCACCA CCAAACCCAT 

GCCAGCGCCA ACCAGTCAGA CTCCGAGACA GGGAGTAGAA CACGAGGCCT CCCGGGATGA 

GGAGCCCAGG TTGACTGGAG GCGCCGCTGG CCACCAGGAC CGCAGCAATT CAGGGCAGTA 

TCCTGCAAAA GGGGGGCCCC AGCAGCCCCA TAATAAAGGC TGTGTGGCTC CCACAGCTGG 

ATTGGCAGCC CTTCTGTTGG CCGTGGCTGC TGGTGTCCTA CTGTGAGCTT CTCCACCTGG 

AAATTTCCCT CTCACCTACT TCTCTGGCCC TGGGTACCCC TCTTCTCATC ACTTCCTGTT 

CCCACCACTG GACTGGGCTG GCCCAGCCCC TGTTTTTCCA ACATTCCCCA GTATCCCCAG 

CTTCTGCTGC GCTGGTTTGC GGCTTTGGGA AATAAAATAC CGTTGTATAT ATTCTGGCAG 

GGGTGTTCTA GCTTTTTGAG GACAGCTCCT GTATCCTTCT CATCCTTGTC TCTCCGCTTG 

TCCTCTTGTG ATGTTAGGAC AGAGTGAGAG AAGTCAGCTG TCACGGGGAA GGTGAGAGAG 

AGGATGCTAA GCTTCCTACT CACTTTCTCC TAGCCAGCCT GGACTTTGGA GCGTGGGGTG 

GGTGGGACAA TGGCTCCCCA CTCTAAGCAC TGCCTCCCCT ACTCCCCGCA TCTTTGGGGA 

ATCGGTTCCC CATATGT CTT CCTTACTAGA CTGTGAGCTC CTCGAGGGCA GGGACCGTGC 

CTTATGTCTG TGTGTGATCA GTTTCTGGCA CATAAATGCC TCAATAAAGA TTTAATTACT 
TTGTATAGTG AAAAAAAA 

Seq ID NO: 569 Protein sequence 
Protein Accession #: NP_055215 

1 11 21 31 41 51 

I i l l I I 

MDPARKAGAQ AMIWTAGWLL LLLLRGGAQA LECYSCVQKA DDGCSPNKMK TVKCAPGVDV 
CTEAVGAVET IHGQFSLAVX GCGSGLPGKN DRGLDLHGLL AFIQLQQCAQ DRCNAKLNLT 
SRALDPAGNE SAYPPNGVEC YSCVGDSREA CQGTSPPWS CYNASDHVYK GCFDGNVTLT 
AANVTVSLPV RGCVQDEFCT RDGVTGPGFT LSGSCCQGSR CNSDLRNKTY FSPRIPPLVR 
LPPPEPTTVA STTSVTTSTS APVRPTSTTK PMPAPTSQTP RQGVEHEASR DEEPRLTGGA 
AGHQDRSNSG QYPAKGGPQQ PHNKGCVAPT AGLAALLLAV AAGVLL 

Seq ID NO: 570 DNA sequence 

Nucleic Acid Accession #: NM_005329.1 

Coding sequence: 1..1662 

1 11 21 31 41 51 

1 I I I I I 

ATGCCGGTGC AGCTGACGAC AGCCCTGCGT GTGGTGGGCA CCAGCCTGTT TGCCCTGGCA 

GTGCTGGGTG GCATCCTGGC AGCCTATGTG ACGGGCTACC AGTTCATCCA CACGGAAAAG 

CACTACCTGT CCTTCGGCCT GTACGGCGCC ATCCTGGGCC TGCACCTGCT CATTCAGAGC 

CTTTTTGCCT TCCTGGAGCA CCGG CGCATG CGACGTGCCG GCCAGGCCCT GAAGCTGCCC 

TCCCCGCGGC GGGGCTCGGT GGCACTGTGC ATTGCCGCGT ACCAGGAGGA CCCTGACTAC 

TTGCGCAAGT GCCTGCGCTC GGCCCAGCGC ATCTCCTTCC CTGACCTCAA GGTGGTCATG 

GTGGTGGATG GCAACCGCCA GGAGGACGCC TACATGCTGG ACATCTTCCA CGAGGTGCTG 

GGCGGCACCG AGCAGGCCGG CTTCTTTGTG TGGCGCAGCA ACTTCCATGA GGCAGGCGAG 

GGTGAGACGG AGGCCAGCCT GCAGGAGGGC ATGGACCGTG TGCGGGATGT GGTGCGGGCC 

AGCACCTTCT CGTGCAT CAT GCAGAAGTGG GGAGGCAAGC GCGAGGT CAT GTACACGGCC 



401 



10 



15 



WO 02/086443 

TTCAAGGCCC TCGGCGATTC 
GATCCAGCCT G C AC CAT CG A 
GTCGGGGGAG ATGTCCAGAT 
GTGCGGTACT GGATGGCCTT 
CAGTGTATTA GTGGGCCCTT 
GACTGGTACC ATCAGAAGTT 
ACCAACCGAG TCCTGAGCCT 
ACAGAGACCC CCACTAAGTA 
TACTTCCGGG AGTGGCTCTA 
TACGAGTCAG TGGTCACGGG 
TTCTACCGGG GCCGCATCTG 
ATTATCAAGG CCACCTACGC 
CTCTACTCCC TCCTCTATAT 
ATCAACAAAT CTGGCTGGGG 
CTCATTCCTG TGTCCATCTG 
TGCCAGGACC TGTTCAGTGA 
GGCTGCTACT GGGTGGCCCT 
AAGAAGCCGG AGCAGTACAG 



PCT/US02/12476 



GGTGGACTAC 
GATGCTTCGA 
CCTCAACAAG 
CAACGTGGAG 
GGGCATGTAC 
CCTAGGCAGC 
TGGCTACCGA 
CCTCCGGTGG 
CAACTCTCTG 
T.TTCT TCCCC 
GAACATTCTC 
CTGCTTCCTT 
GTCCAGCCTT 
CACCTCTGGC 
GGTGGCAGTT 
GACAGAGCTA 
CCTCATGCTA 
CTTGGCTTTT 



ATCCAGGTGT 
GTCCTGGAGG 
TACGACTCAT 
CGGGCCTGCC 
CGCAACAGCC 
AAGTGCAGCT 
ACTAAGTATA 
CTCAACCAGC 
TGGTTCCATA 
TTCTTCCTCA 
CTCTTCCTGC 
CGGGGCAATG 
CTGCCGGCCA 
CGAAAAACCA 
CTCCTGGGAG 
GCCTTCCTTG 
TATCTGGCCA 
GCTGAGGTGT 



GCGACTCTGA 
AGGATCCCCA 
GGATTTCCTT 
AGTCCTACTT 
TCCTCCAGCA 
TCGGGGATGA 
CCGCGCGCTC 
AAACCCGCTG 
AGCACCACCT 
TTGCCACGGT 
TGACGGTGCA 
CAGAGATGAT 
AGATCTTTGC 
TTGTGGTGAA 
GGCTGGCCTA 
TCTCTGGGGC 
TCATCGCCCG 
GA 



CACTGTGCTG 660 

AGTAGGGGGA 720 

CCTGAGCAGC 780 

TGGCTGTGTG 840 

GTTCCTGGAG 900 

CCGGCACCTC 960 

CAAGTGCCTC 1020 

GAGCAAGTCT 1080 

CTGGATGACC 1140 

TATACAGCTT 1200 

GCTGGTGGGC 1260 

CTTCATGTCC 132 0 

CATTGCTACC 1380 

CTTCATTGGC 1440 

CACAGCTTAT 1500 

TATACTGTAT 1560 

GCGATGTGGG 1620 



20 



Seq ID NO: 571 Protein sequence 
Protein Accession #: NP_005320.1 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



I 

MPVQLTTALR 
LFAFLEHRRM 
WDGNRQEDA 
STFSCIMQKW 
VGGDVQILNK 
DWYHQKFLGS 
YFREWLYNSL 
1 1 KATYACFIi 
LIPVSIWVAV 
KKPEQYSLAF 



11 

1 

WGTSLFALA 
RRAGQALKLP 
YMLDIFHEVL 
GGKREVMYTA 
YDSWISFLSS 
KCSFGDDRHL 
WFHKHHLWMT 
RGNAEMIFMS 
LLGGLAYTAY 
AEV 



21 



VLGGILAAYV 
SPRRGSVALC 
GGTEQAGFFV 
FKALGDSVDY 
VRYWMAFNVE 
TNRVLSLGYR 
YESWTGFFP 
LYSLLYMSSL 
CQDLFSETEL 



31 

! 

TGYQFIHTEK 
IAAYQEDPDY 
WRSNFHEAGE 
IQVCDSDTVL 
RACQSYFGCV 
TKYTARSKCL 
FFLIATVIQL 
LPAKIFAIAT 
AFLVSGAILY 



41 



51 



HYLSFGLYGA 
LRKCLRSAQR 
GETEASLQEG 
DPACTIEMLR 
QCISGPLGMY 
TETPTKYLRW 
FYRGRIWNIL 
INKSGWGTSG 
GCYWVALLML 



ILGLHLLIQS 
I SFPDLKWM 
MDRVRDWRA 
VLEEDPQVGG 
RNSLLQQFLE 
LNQQTRWSKS 
LFLLTVQLVG 
RKTIWNFIG 
YLAI I ARRCG 



Seq ID NO: 572 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 148-7095 



11 



21 



31 



41 



51 



85 



CACACATACG 
CAAAAAAAAC 
CGGCGAGGGG 
CAGCTCCTCT 
CTTGTTGAAG 
AAATATCCAA 
CAAGTAAATG 
AACACATTCA 
GTCAGCGGAG 
AAATGCAATA 
GAGATGCAAA 
GGAAAAGGGA 
GATT TCAAAG 
TTAGATCCAT 
AATGG CT CAT 
ACAGTTAGCA 
TCTGGTTATG 
TTCTCTAGAC 
AGTTCAGAAC 
TGGGAAAGAC 
CAGTTGGATG 
GGTGCTATTC 
TGCACTAATG 
AATCCTGAAC 
GAAGAGGGAA 
AACCAAATCA 
ACGAAATACA 
AAGGGTGATG 
ACAGAAAAAG 
GAAGGTACTT 
AACTTGTCGG 
AGTTTATTGA 
GCAACTTCTG 
GAAAACCCAG 
GAAGATTCAA 
GTGTGGTTTC 
AGCTTTCTCC 
TCCTTTTCTG 
CATTATTCTA 
TCCAGACAAC 
GTATACAATG 
ACCCCTTTGT 
TCGGCCTTGC 
TCTTCCTATG 
TTTCGCCATC 
GATAAGGTGC 



CACGCACGAT 
ATTTCCTTCG 
CCGCAGACCG 
GTGTTTGCCG 
AGATTGGCTG 
CATGTAATAG 
TGAATCTTAA 
TTCATAACAC 
GAGTTTCAGA 
TGTCATCTGA 
TCTACTGCTT 
AGTTAAGAGC 
CGATTATTGA 
TCATACTGTT 
TGACATCTCC 
TCTCTGAAAG 
TCATGCTGAT 
AGGTGTTTTC 
CAGAAAATGT 
CT CGAGTCGT 
GAGAGGACCA 
TCAATAATTT 
GCTTATATGG 
TTGATCTTTT 
AAGACATTGA 
GGAAAAAGGA 
ATGAAGCCAA 
TTCCCAATAC 
ATATTTCCTT 
CAGCCTCTTT 
GGACTGCAGA 
CCAGTTTCAA 
CTATCCCATT 
AGACAATAAC 
CTTCATCAGG 
CTAGCTCTAC 
AGACTAATTA 
CAGGCCCAGT 
CCTTTGCCTA 
AGGATTTGGT 
GTGAGACACC 
TGCTTGACAA 
ATGCTACGCC 
ATGGTGCACC 
TGCATACAGT 
CCTTGCATGC 



CTCACTTCGA 
CTCCCCCTCC 
TCTGGAAATG 
CCTGGATTGG 
GTCCTATACA 
CCCAAAACAA 
GAAACTTAAA 
TGGGAAAACA 
AATGGTGTTT 
TGGATCAGAG 
TGATGCGGAC 
TTTATCCATT 
TGGAGTCGAA 
GAACCTTCTG 
TCCCTGCACA 
CCAGTTGGCT 
GGACTACTTA 
CTCATACACT 
TCAGGCTGAC 
TTATGATACC 
AACCAAGCAT 
GCTACCCAAT 
AAAAT ACAG C 
CCCTGAATTA 
AGAAGGCGCT 
ACCCCAGATT 
GACTAACCGA 
ATCTTTAAAT 
GACTTCTCAG 
AAATGATGGC 
AT CCTT AAAT 
GCTTGATACT 
CATCTCTGAG 
ATATGATGTC 
TTCAGAAGAA 
AGACATAACA 
CACTGAGATA 
GATGTCACAG 
CTTCCCAACT 
CTCCACGGTC 
TCTTCAACCT 
TCAGATCCTC 
TGTATTTCCC 
TTTGCTTCCA 
TTCTCAAATC 
TTCTCTGCCA 



TCTATACACT 
CTCTCCACTC 
CGAATCCTAA 
GCTAATGGAT 
GGAGCACTGA 
TCTCCTATCA 
TTTCAGGGTT 
GTGGAAATTA 
AAAGCAAGCA 
CATAGTTTAG 
CGATTTTCAA 
TTGTTTGAGG 
AGTGTTAGTC 
CCAAACTCAA 
GACACAGTTG 
GTTTTTTGTG 
CAAAACAATT 
GGAAAGGAAG 
CCAGAGAATT 
ATGATTGAGA 
GAATTTTTGA 
ATGAGTTATG 
G AC CAACTG A 
ATTGGAACTG 
ATTGTGAATC 
TCTACCACAA 
TCCCCAACAA 
TCCACTTCCC 
ACTGTGACTG 
TCTAAAACTG 
ACAGTTTCTA 
GGAGCTGAAG 
AACATAT CCC 
CTTATACCAG 
TCACTAAAGG 
GCACAGCCCG 
CGTGTTGATG 
GGTCCCTCAG 
GAGGTAACAC 
AACGTGGTAT 
TCCTACAGTA 
AACACTACCC 
AGTGT CGATG 
TTTTCCTCTG 
CTTCCACAAG 
GTGGCTGGGG 



GGAGGATTAA 
TGAGAAGCAG 
AGCGTTTCCT 
ACTACAGACA 
ATCAAAAAAA 
ATATTGATGA 
GGGATAAAAC 
ATCT CACTAA 
AGATAACTTT 
AAGGACAAAA 
GTTTTGAGGA 
TTGGGACAGA 
GTTTTGGGAA 
CTGACAAGTA 
ACTGGATTGT 
AAGTT CTTAC 
TTCGAGAGCA 
AGATT CATGA 
ATACCAGCCT 
AGTTTGCAGT 
CAGATGGCTA 
TTCTTCAGAT 
TTGTCGACAT 
AAGAAATAAT 
CTGGTAGAGA 
CACACTACAA 
GAGGAAGTGA 
AACCAGTCAC 
AACTGCCACC 
TTCTTAGATC 
TAACAGAATA 
ATTCTTCAGG 
AAGGGTATAT 
AATCTGCTAG 
ATCCTTCTAT 
ATGTTGGATC 
AATCTGAGAA 
TTACAGATCT 
CTCATGCTTT 
ACT CGCAGAC 
GTGAAGTCTT 
CTGCTGCTTC 
TGTCATTTGA 
CTTCCTTCAG 
TTACTTCAGC 
GTGATTTGCT 



AACAAACAAA 
AGGAGCCGCA 
CGCTTGCATT 
A GAG AGAAAA 
TTGGGGAAAG 
AGATCTTACA 
AT CATTGGAA 
TGACTACCGT 
TCACTGGGGA 
ATTTCCACTT 
AGCAGTCAAA 
AGAAAATTTG 
GCAGGCTGCT 
TTACATTTAC 
TTTTAAAGAT 
AATGCAACAA 
ACAGTACAAG 
AGCAGTTTGT 
TCTTGTTACA 
TTTGTACCAG 
TCAAGACTTG 
AGTAGCCATA 
GCCTACTGAT 
CAAGGAGGAG 
CAGTGCTACA 
TCGCATAGGG 
ATTCTCTGGA 
TAAATTAGCC 
TCACACTGTG 
TCCACATATG 
TGAGGAGGAG 
CTCCAGTCCC 
ATTTTCCTCC 
AAATGCTTCC 
GGAGGGAAAT 
AGGCAGAGAG 
GACAACCAAG 
GGAAATGCCA 
TACCCCATCC 
AACCCAACCG 
TCCTCTAGTC 
AAGTAGTGAT 
ATCCATCCTG 
TAGTGAATTG 
TACCGAGAGT 
ATTAGAGCCC 



60 
120 
180 
240 
300 
360 
420 
480 
540 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
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65 
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AGCCTTGCTC AGTATTCTGA 
TTTGGTAGTG AATCTGGTGT 
AGCAGTGATG CCATGATGCA 
GATAATGAGG GCTCCCAACA 
GATT CTGTGG GTGTAACTTA 
CCTAAGTCTT CGTTAATAAC 
GGTGATGGGG AATGGT CTGG 
GGGCTGACAG CCCTTAACAT 
TCTGTGTTTG GTGATGATAA 
ACTGAACTGC AAATTCCTTC 
CCCAACATGT ATGATAATGT 
ATTTCTAGCA CCAAGGGCAT 

GATCATGAGA TTAGTCAAGT 
TCTCAAGCAT CTGGTGACAC 
TCCTCTGACC CTGCTTCTAG 
ACCTCAGCTT CTTTTAGTAC 
GACACCTTGC TTAAAACTGT 
CCCAAAGTTG ATAAAATTAG 
AGTGAAAACA TGCTGCACTC 
ATGCACTCTG CTTCACTTCA 
GTTTTGTTAA AAAGTGAAAG 
TTGTTCCAAA CGGCCAATTT 
TTTGCTACAC CTGTTTTATC 
CATT CCGATG AAATTTTAAC 
ATTCCAACAG TTGCTTCTGA 
GGGCATGTTG CCATTACAGC 
TTGCTGTTTC CTTCTAAGGC 
TTAGTGGGTG GTGGTGAAGA 
AGAGGTAGTG ATGGCTTATC 
CAGGAAAAGG TAATGAATGA 
CCAAT CTCAT ACTCACTATC 
TCAGACAGTC AAACTGGTAT 
TCCCAAAAGC ACAATGATGG 
CCTCTCAGCC CTGAATCTAA 
GGGCAAGGTA CCT CAGATAG 
GACACTAATG AAAAAGATG C 
GGATTCCCAC AGTCCCCAAC 
TCAGAGGCAG AGGCCAGTAA 
GAATCCGAGA AGAAGGCAGT 
CTAGTGGTTC TTGTGGGTAT 
TACTTAGAGG ACAGTACATC 
ATTTCAGATG ATGTCGGAGC 
CATGCAAGTA GTGGGTTTAC 
CAGAGCTGTA CTGTTGACTT 
CACAAGAATC GATACATAAA 
CTTGCTGAAA AGGATGGCAA 
AACAGACCAA AAGCTTATAT 
TGGAGAATGA TATGGGAACA 
AAAGGAAGGA GAAAATGTGA 
TTTCTGGTCA CTCAGAAGAG 
CTAAGAAACA CAAAAATAAA 
ACACAGTATC ACTACACGCA 
CTGACCTTTG TGAGAAAGGC 
CACTGCAGTG CTGGAGTTGG 
CAGATTCAAC ACGAAGGAAC 
AGAAATTATT TGGTACAAAC 
GCCATACTTA GT AAAG AAA C 
CTCCTCATTC CTGGACCAGC 
CAGTCAAATA TACAGCAGAG 
AATCGAACTT CTTCTATCAT 
GGAGAAGGCA CAGACTACAT 
TTCATCATTA CCCAGCACCC 
GACCATAATG CCCAACTGGT 
TTTGTTTACT GGCCAAATAA 
ATGGCTGAAG AACACAAATG 
TTAGAAGCTA CACAGGATGA 
CCAAATCCAG ATAGCCCCAT 
GCTGCCAATA GGGATGGGCC 
ACTTTCTGTG CTCTGACAAC 
TACCAGGTAG CCAAGATGAT 
TATCAGTTTC TCTACAAAGT 
TCCACCTCTC TGGACAGTAA 
GAGTCTTTAG TTTAACACAG 
TTCCTAAAAT TAGGCAGGAA 
GACAGTAACT TTCATGACAT 
CTTTTTGCAA G ACT TGT AAT 
TATTTCTAAG AATGGAATTG 
TTTATAGAGG TTAGGAATTC 
GCTGTATTTG TAGCAATTAT 
AAATAAAACA CTCTTCCATA 
AGAAATAATC TGTTACTTAT 
TTTATAATTG TAGATTTTTA 
GTTTAGTTTA ATGACGTAGT 
TTGTGTTACC TAAGTCATTA 
GAAATACCTT CATTTTGAAA 
AATGGTTTTT ATCCAAGGAA 
AAAAAAAAAA AAAAAAAAAA 
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TGTGCTGTCC 
TCTTTATAAA 
TGCACGTTCT 
CATCTTCACT 
TCAGGGTTCC 
CCCAACTGCA 
AGCCTCTTCT 
TTCTTCACCT 
TAAGGCGCTT 
TTT CAATGAG 
AAATAAGTTG 
GTTTCCAGGG 
TCCAGAAAAT 
TTCGCTTAAA 
TGAAATGTTA 
TGAAGTATTG 
TCTTCCAGCT 
TTCTACAATG 
TACATCTGTA 
AGGTTTGACC 
TTCCCACCAA 
GGAGATTAAC 
AATTGATGAA 
CTCCACCAAA 
TA CAT T TGT A 
TGTTTCTCCC 
AACTTCTGAG 
TGGTGACACT 
CATTCATAAG 
TTCAGACACC 
TGAGAATTCT 
GGACAGAAGT 
AAAAGAGGAA 
AGCATGGGCA 
CCTTAATGAG 
TGATGGGAT C 
ATCATCTGTT 
TAGTAGCCAT 
TATACCCCTT 
TCTCATCTAC 
CCCTAGAGTT 
AATT CCAAT A 
TGAAGAATTT 
AGGTATTACA 
TATCGTTGCC 
ACTGACTGAT 
TGCTGCCCAA 
TAATGTGGAA 
TCAGTACTGG 
TGTG CAAGTG 
AAAGGGCTCC 
GTGGCCTGAC 
AGCCTATGCC 
AAGAACAGGC 
TGT CAACAT A 
TGAGGAGCAA 
TGAGGTGCTG 
AGGCAAAACA 
TGACTATTCT 
CCCTGTGGAA 
CAATGCCTCC 
TCTCCTTCAT 
GGTTATGATT 
AGATGAGCCT 
TCTATCTAAT 
TTATGTACTT 
TAGTAAAACT 
TATGATTGTT 
CCTTATGCAC 
C AAT CTGATG 
GATCCTCAGC 
TGGTGCAGCA 
AAAGGGGTGG 
AATCAGTCTA 
AGGATTCTGC 
TTACTTATTA 
TGGTATTTTT 
CAAACTACAG 
CAGGTTTGCT 
TGATATTCAA 
TGTAAATACT 
TATTTTACTA 
TCATTAGCTG 
ACTTTGTTTC 
GAAGTTTTTA 
TTGCAAAAAT 
AAAA 



ACTACTCATG 
ACGCTTATGT 
TCAGGGCCTG 
GTTTCTTACA 
TTATTTAGCG 
TCATTACTGC 
GATAGTGAAT 
GTTTCTGTAG 
TCTAAAAGTG 
ATGGTTTACC 
AATGCGTCTT 
TCCCTTGCTC 
AACTTTTCAG 
CCTGTGCTTA 
TCTCCTTCAA 
CTACAACCTT 
GTGCCCAGTG 
TTGCATCTCA 
CCAGTTTTTG 
AT TTCCTATG 
GTGGTACCTT 
CAGGCCCATC 
CCATTAAATA 
AGTTCTGTTA 
TCTACTGATC 
CACAGAGATG 
CTGAGTCATA 
GATGATGATG 
TGTATGTCAT 
CACGAAAACA 
GAAGAAGATA 
CCTGGTAAAT 
AATGACATTC 
GTTCTGACAA 
AATGAGACTT 
CTGGCAGCAG 
ACTAGCGAGA 
GAGTCTCGTA 
GTGATCGTGT 
TGGAGGAAAT 
ATATCCACAC 
AAGCACTTTC 
GAGACACTGA 
GCAGACAGCT 
TATGATCATA 
TATATCAATG 
GGCCCACTGA 
GTTATTGTCA 
CCTGCCGATG 
CTTGCCTATT 
CAGAAAGGAA 
ATGGGAGTAC 
AAGCGCCATG 
ACATAT AT TG 
TTTGGCTTCT 
TATGTCTTCA 
GACAGTCATA 
AAGCTAGAGA 
GCAGCCCTAA 
AGAT CAAGGG 
TATATCATGG 
ACCATCAAGG 
CCTGATGGCC 
ATAAATTGTG 
GAGGAAAAAC 
GAAGTGAGGC 
TTTGAACTTA 
CATGATGAGC 
CAACTAGAAA 
AGGCCAGGAG 
CTTGTGAGCA 
TTGCCTGATG 
GGGGACT CAC 
GTTCTGTTAT 
CGCCAAATTT 
TGTTTGAACT 
TTCTGTATTG 
AAAATGTTTG 
AGAAATATAA 
CATTTTACAA 
GCCCTAGTGT 
CTGAGTCAAG 
GTCTTACTCT 
AGCATGTAAT 
TGAGAATAAC 
AAATATAAAT 



CTGCTTCAGA 
TTTCTCAAGT 
AACCTTCTTA 
GTTCTGCAAT 
GCCCTAGCCA 
AGCCTACTCA 
TTCTTTTACC 
CTGAATTTAC 
AAATAATATA 
CTTCTGAAAG 
TACAAGAAAC 
ATACCACCAC 
TTCAACCTAC 
GTGCAAACTC 
CTCAGCTCTT 
CCTTTCAGGC 
ATCCAATATT 
TTGTAT CAAA 
ATGTGTCGCC 
CAAGTGAGAA 
CTTTGTACAG 
CCCCAAAAGG 
CACTAATAAA 
CTGGTAAGGT 
ATTCTGTTCC 
GTTCTGTAAC 
GTGCCAAATC 
GTGATGATGA 
GCTCATCCTA 
GTCTTATGGA 
ATAGAGTCAC 
CACCATCAGC 
AGACTGGTAG 
GTGATGAAGA 
CCACAGATTT 
GTGACT CAGA 
ACTCAGAAGT 
TTGGTCTAGC 
CAGCCCTGAC 
GCTTCCAGAC 
CTCCAACACC 
CAAAGCATGT 
AAGAGTTTTA 
CCAACCACCC 
GCAGGGTTAA 
CCAATTATGT 
AATCCACAGC 
TGATAACAAA 
GGAGTGAGGA 
ATACTGTGAG 
GACCCAGTGG 
CAGAGTACTC 
CAGTGGGGCC 
TGCTAGACAG 
TAAAACACAT 
TTCATGATAC 
TTCATGCCTA 
AACAATTCCA 
AGCAATGCAA 
TTGGCATTTC 
GCTATTACCA 
ATTTCTGGAG 
AAAACATGGC 
AGAGCTTTAA 
TTATAATTCA 
ACTTTCAGTG 
TAAGTGTTAT 
ATGGAGGAGT 
AAGAAAATTC 
TCTTTGCTGA 
CAAGGCAGGA 
GAAATATAGC 
ATCTGAGCAT 
CTGTTGATTT 
ATATCATTAA 
AAAATGATTG 
ATTTTAACAG 
TTTTTAGTGT 
CTTTTAATAC 
CTGCAGTATT 
CTCCATGGAC 
TTTTCTAGTT 
ACCAGTTTTC 
TTTAACTTTT 
ACCTTACCAA 
AT TGCCATTA 



GACGCTGGAA 


2820 


mmm m^ ^ ^ - ~ _ - _t — ■ 

TGAACCACCC 


2880 


TGCCTTGTCT 


2940 


ACCTGTGCAT 


3000 


TATACCAATA 


3060 


TGCCCTCTCT 


3120 


TGACACAGAT 


3180 


ATATACAACA 


3240 


TGGAAATGAG 


3300 


CACAGTCATG 


3360 


CTCTGTTTCC 


3420 


TAAGGTTTTT 


3480 


ACATACTGTC 


3540 


AGAGCCAGCA 


3600 


ATTTTATGAG 


3660 


TTCTGATGTT 


3720 


mm* m^m iw« pm * M m v. Tfc mm *mm 

GGTTGAAACC 


3780 


TTCTGCTTCA 


3840 


TACTTCTCAT 


3900 


ATATGAACCA 


3960 


TAATGATGAG 


4020 


AAGGCATGTA 


4080 


TAAGCTTATA 


4140 


ATTTGCTGGT 


4200 


TATAGGAAAT 


4260 


CTCAACAAAG 


4320 


m — ■ ■■■ mm* /mm -mmm** mm r-n 

TGATGCCGGT 


4380 


TGATGATGAC 


4440 


TAGAGAATCA 


4500 


TCAGAATAAT 


4560 


AAGTGTATCC 


4620 


AAATGGGCTA 


4680 


TGCTCTGCTT 


4740 


AAGTGGATCA 


4800 


CAGTTTTGCA 


4860 


AATAACTCCT 


4920 


GTTCCACGTT 


4980 


TGAGGGGTTG 


5040 


TTTTATCTGT 


5100 


TGCACACTTT 


5160 


TATCTTTCCA 


5220 


TGCAGATTTA 


5280 


CCAGGAAGTG 


5340 


AGACAACAAG 


5400 


GCTAGCACAG 


5460 


TGATGGCTAC 


5520 


TGAAGATTTC 


5580 


CCTCGTGGAG 


5640 


GTACGGGAAC 


5700 


GAATTTTACT 


5760 


ACGTGTGGTC 


5820 


CCTGCCAGTG 


5880 


TGTTGTCGTC 


5940 


TATGTTGCAG 


6000 


CCGT T CACAA 


6060 


ACTGGTTGAG 


6120 


TGTTAATGCA 


6180 


GCTCCTGAGC 


6240 


CAGGGAAAAG 


6300 


ATCCCTGAGT 


6360 


GAGCAATGAA 


6420 


GATGATATGG 


6480 


AGAAGATGAA 


6540 


GGT CACTCTT 


6600 


GGACTTTATC 


6660 


TCCTAAATGG 


6720 


4 — _ — mm, Mi ml m%m ^ , 

AAAAGAAGAA 


6780 


>■ — mm +mm mm, jmrn-mm. AWmi mm mm 

GACGGCAGGA 


6840 


CGTGGATGTT 


6900 


CATTGAGCAG 


6960 


AGAGAATCCA 


7020 


TGAGAGCTTA 


7080 


TGTTTTCCTC 


7140 


CCCATCACCT 


7200 


CAATGTGTGC 


7260 


AATT TTACAG 


7320 


AAAATTTCAA 


7380 


CAAATTTTTA 


7440 


AGTAGCCTGT 


7500 


CACCTAAAGT 


7560 


CAAATTTATA 


7620 


CTGTGTAATT 


7680 


TGACATTGTA 


7740 


GTGGAAAATA 


7800 


ACATTGTTCA 


7860 


AAAAAAAAAA 


7920 



403 
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Seq ID NO: 573 Protein' sequence : 
Protein Accession #: Eos sequence 

5 1 11 21 31 41 51 

I I I l l I 

MRILKRFLAC IQLLCVCRLD WANGYYRQQR KLVEEIGWSY TGALNQKNWG KKYPTCNSPK 60 

QSPINIDEDL TQVNVNLKKL KFQGWDKTSL ENTFIHNTGK TVEINLTNDY RVSGGVSEMV 12 0 

FKASKITFHW GKCNMSSDGS EHSLEGQKFP LEMQIYCFDA DRFSSFEEAV KGKGKLRALS 180 

10 ILFEVGTEEN LDFKAIIDGV ESVSRFGKQA ALDPFILLNL LPWSTDKYYI YNGSLTSPPC 240 

TDTVDWIVFK DTVSISESQL AVFCEVLTMQ QSGYVMLMDY LQNNFREQQY KFSRQVFSSY 300 

TGKEEIHEAV CSSEPENVQA DPENYTSLLV TWERPRWYD TMIEKFAVLY QQLDGEDQTK 3 60 

HEFLTDGYQD LGAILNNLLP NMSYVLQIVA ICTNGLYGKY SDQLIVDMPT DNPELDLFPE 42 0 

LIGTEEIIKE EEEGKDIEEG AIVNPGRDSA TNQIRKKEPQ ISTTTHYNRI GTKYNEAKTN 480 

15 RSPTRGSEFS GKGDVPNTSL NSTSQPVTKL ATEKDISLTS QTVTELPPHT VEGTSASLND 540 

GSKTVLRSPH MNLSGTAESL NTVS I TEYEE ESLLTSFKLD TGAEDSSGSS PATSAIPFIS 600 

ENISQGYIFS SENPETITYD VLIPESARNA SEDSTSSGSE ESLKDPSMEG NVWFPSSTDI 660 

TAQPDVGSGR ESFLQTNYTE IRVDESEKTT KSFSAGPVMS QGPSVTDLEM PHYSTFAYFP 72 0 

TEVTPHAFTP SSRQODLVST VNWYSQTTQ PVYNGETPLQ PSYSSEVFPL VTPMjLDNQI 780 

20 LNTTPAASSS DSALHATPVF PSVDVSFESI LSSYDGAPLL PFSSASFSSE LFRHLHTVSQ 840 

IIjPQVTSATE SDKVPLHASL PVAGGDLLLE PSLAQYSDVL STTHAASETL EFGSESGVLY 900 

KTLMFSQVEP PSSDAMMHAR SSGPEPSYAL SDNEGSQHIF TVSYSSAIPV HDSVGVTYQG 960 

SLFSGPSHIP IPKSSLITPT ASLLQPTHAL SGDGEWSGAS SDSEFLLPDT DGLTALNISS 102 0 

PVSVAEFTYT TSVFGDDNKA LSKSEIIYGN ETELQIPSFN EMVYPSESTV MPNMYDNVNK 1080 

25 LNASLQETSV SISSTKGMFP GSLAHTTTKV FDHEISQVPE NNFSVQPTHT VSQASGDTSL 1140 

KPVLSANSEP ASSDPASSEM LSPSTQLLFY ETSASFSTEV LLQPSFQASD VDTLLKTVLP 12 00 

AVPSDPILVE TPKVDKISST MLHLIVSNSA SSENMLHSTS VPVFDVSPTS HMHSASLQGL 12 60 

TISYASEKYE PVLLKSESSH QWPSLYSND ELFQTANLEI NQAHPPKGRH VFATPVLSID 132 0 

EPLNTLINKL IHSDEILTST KSSVTGKVFA GIPTVASDTF VSTDHSVPIG NGHVAI TAVS 1380 

30 PHRDGSVTST KLLFPSKATS ELSHSAKSDA GLVGGGEDGD TDDDGDDDDD DRGSDGLSIH 1440 

KCMSCSSYRE SQEKVMNDSD THENSLMDQN NPISYSLSEN SEEDNRVTSV SSDSQTGMDR 1500 

SPGKSPSANG LSQKHNDGKE ENDIQTGSAL LPLSPESKAW AVLTSDEESG SGQGTSDSLN 1560 

ENETSTDFSF ADTNEKDADG ILAAGDSEIT PGFPQSPTSS VT SENS E VFH VSEAEASNSS 1620 

HESRIGLAEG LESEKKAVIP LVIVSALTFI CLWLVGILI YWRKCFQTAH FYLEDSTSPR 1680 

35 VISTPPTPIF PISDDVGAIP I KHFPKHVAD LHASSGFTEE FETLKEFYQE VQSCTVDLGI 1740 

TAD S SNHPDN KHKNRYINIV AYDH SRVKL A QLAEKDGKLT DYINANYVDG YNRPKAY I AA 18 00 

QGPLKSTAED FWRMIWEHNV EVIVMITNLV EKGRRKCDQY WPADGSEEYG NFLVTQKSVQ 1860 

VLAYYTVRNF TLRNTKIKKG SQKGRPSGRV VTQYHYTQWP DMGVPEYSLP VLTFVRKAAY 192 0 

AKRHAVGPW VHCSAGVGRT GTYIVLDSML QQIQHEGTVN IFGFLKHIRS QRNYLVQTEE 1980 

40 QYVFIHDTLV EAILSKETEV LDSHIHAYVN ALLIPGPAGK TKLEKQFQLL SQSNIQQSDY 2040 

SAALKQCNRE KNRTSSIIPV ERSRVGISSL SGEGTDYINA SYIMGYYQSN EFIITQHPLIi 2100 

HTIKDFWRMI WDHNAQLWM I PDGQNMAED EFVYWPNKDE PINCESFKVT LMAEEHKCLS 2160 

NEEKLIIQDF ILEATQDDYV LEVRHFQCPK WPNPDSPISK TFELISVIKE EAANRDGPMI 2220 

VHDEHGGVTA GTFCALTTLM HQLEKENSVD VYQVAKMINL MRPGVFAD I E QYQFLYKVIL 22 80 

45 SLVSTRQEEN PSTSLDSNGA ALPDGNIAES LESLV 

Seq ID NO: 574 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 148-4518 

1 11 21 31 41 51 

i I 1 I I I 

CACACATACG CACGCACGAT CTCACTTCGA TCTATACACT GGAGGATTAA AACAAACAAA 60 

CAAAAAAAAC ATTTCCTTCG CTCCCCCTCC CTCTCCACTC TGAGAAGCAG AGGAGCCGCA 120 

55 CGGCGAGGGG CCGCAGACCG TCTGGAAATG CGAATCCTAA AGCGTTTCCT CGCTTGCATT 180 

CAGCTCCTCT GTGTTTGCCG CCTGGATTGG GCTAATGGAT ACTACAGACA ACAGAGAAAA 240 

CTTGTTGAAG AGATTGGCTG GTCCTATACA GGAGCACTGA ATCAAAAAAA TTGGGGAAAG 300 

AAATATCCAA CATGTAATAG CCCAAAACAA TCTCCTATCA ATATTGATGA AGATCTTACA 360 

CAAGTAAATG TGAATCTTAA GAAACTTAAA TTTCAGGGTT GGGATAAAAC AT CATTGGAA 420 

60 AACACATTCA T T CAT AACAC TGGGAAAACA GTGGAAATTA ATCTCACTAA TGACTACCGT 480 

GTCAGCGGAG GAGTTTCAGA AATGGTGTTT AAAGCAAGCA AGATAACTTT TCACTGGGGA 540 

AAATGCAATA TGTCAT CTGA TGGATCAGAG CATAGTTTAG AAGGACAAAA ATTTCCACTT 60 0 

GAGATGCAAA TCTACTGCTT TGATGCGGAC CGATTTTCAA GTTTTGAGGA AGCAGTCAAA 660 

GGAAAAGGGA AGTTAAGAGC TTTATCCATT TTGTTTGAGG TTGGGACAGA AGAAAATTTG 72 0 

65 GATTT CAAAG CGATTATTGA TGGAGTCGAA AGTGTTAGTC GTTTTGGGAA GCAGGCTGCT 780 

TTAGATCCAT TCATACTGTT GAACCTTCTG CCAAACT CAA CTGACAAGTA TTACATTTAC 840 

AATGGCT CAT TGACATCTCC TCCCTGCACA GACACAGTTG ACTGGATTGT TT TTAAAG AT 900 

ACAGTTAGCA TCTCTGAAAG CCAGTTGGCT GTTTTTTGTG AAGTTCTTAC AATGCAACAA 960 

TCTGGTTATG TCATGCTGAT GGACTACTTA CAAAACAATT TTCGAGAGCA ACAGTACAAG 1020 

70 TTCTCTAGAC AGGTGTTTTC CTCATACACT GGAAAGGAAG AGATTCATGA AGCAGTTTGT 1080 

AGTTCAGAAC CAGAAAATGT TCAGGCTGAC CCAGAGAATT ATACCAGCCT TCTTGTTACA 1140 

TGGGAAAGAC CTCGAGTCGT TTATGATACC ATGATTGAGA AGTTTGCAGT TTTGTACCAG 1200 

CAGTTGGATG GAGAGGACCA AACCAAGCAT GAATTTTTGA CAGATGGCTA TCAAGACTTG 12 60 

GGTGCTATTC TCAATAATTT GCTACCCAAT ATGAGTTATG TTCTTCAGAT AGTAGCCATA 132 0 

75 TGCACTAATG GCTTATATGG AAAATACAGC GACCAACTGA TTGTCGACAT GCCTACTGAT 13 80 

AATCCTGAAC TTGATCTTTT CCCTGAATTA ATTGGAACTG AAGAAATAAT CAAGGAGGAG 1440 

GAAGAGGGAA AAGACATTGA AGAAGGCGCT ATTGTGAATC CTGGTAGAGA CAGTGCTACA 1500 

AACCAAATCA GGAAAAAGGA ACCCCAGATT TCTACCACAA CACA CT AC AA TCGCATAGGG 1560 

ACGAAATACA ATGAAGCCAA GACTAACCGA TCCCCAACAA GAGGAAGTGA ATTCTCTGGA 1620 

80 AAGGGTGATG TTCCCAATAC ATCTTTAAAT TCCACTTCCC AACCAGTCAC TAAATTAGCC 1680 

ACAGAAAAAG ATATTTCCTT GACTTCTCAG ACTGTGACTG AACTGCCACC TCACACTGTG 1740 

GAAGGTACTT CAGCCTCTTT AAATGATGGC TCTAAAACTG TTCTTAGATC TCCACATATG 1800 

AACTTGTCGG GGACTGCAGA ATCCTTAAAT ACAGTTTCTA TAACAGAATA TGAGGAGGAG 1860 

AGTTTATTGA CCAGTTTCAA GCTTGATACT GGAGCTGAAG ATTCTTCAGG CTCCAGTCCC 1920 

85 GCAACTTCTG CTATCCCATT CATCTCTGAG AACATATCCC AAGGGTATAT ATTTTCCTCC 1980 

GAAAACCCAG AGACAATAAC ATATGATGTC CTTATACCAG AATCTGCTAG AAATGCTTCC 2040 

GAAGATTCAA CTTCATCAGG TTCAGAAGAA TCACTAAAGG ATCCTTCTAT GGAGGGAAAT 210 0 
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GTGTGGTTTC CTAGCTCTAC 
AGCTTTCTCC AGACTAATTA 
TCCTTTTCTG CAGGCCCAGT 
CATTATTCTA CCTTTGCCTA 
TCCAGACAAC AGGATTTGGT 
GTATACAATG CAGAGGCCAG 
TTGGAATCCG AGAAGAAGGC 
TGTCTAGTGG TTCTTGTGGG 
TTTTACTTAG AGGACAGTAC 
CCAATTTCAG ATGATGTCGG 
TTACATGCAA GTAGTGGGTT 
GTGCAGAGCT GTACTGTTGA 
AAGCACAAGA ATCGATACAT 
CAGCTTGCTG AAAAGGATGG 
TACAACAGAC CAAAAGCTTA 
TTCTGGAGAA TGATATGGGA 
GAGAAAGGAA GGAGAAAATG 
AACTTTCTGG TCACTCAGAA 
ACTCTAAGAA ACACAAAAAT 
GTCACACAGT ATCACTACAC 
GTGCTGACCT TTGTGAGAAA 
GTCCACTGCA GTGCTGGAGT 
CAGCAGATTC AACACGAAGG 
CAAAGAAATT ATT TGGTACA 
GAGGCCATAC TTAGTAAAGA 
GCACTCCTCA TTCCTGGACC 
AGCCAGTCAA ATATACAGCA 
AAGAAT CG AA CTTCTTCTAT 
AGTGGAGAAG GCACAGACTA 
GAATTCATCA TTACCCAGCA 
TGGGACCATA ATGCCCAACT 
GAATTTGTTT ACTGGCCAAA 
CTTATGGCTG AAGAACACAA 
ATCTTAGAAG CTACACAGGA 
TGGCCAAATC CAGATAGCCC 
GAAGCTGCCA AT AGGGATGG 
GGAACTTTCT GTGCTCTGAC 
GTTTACCAGG TAGCCAAGAT 
CAGTATCAGT TTCTCTACAA 
CCATCCACCT CTCTGGACAG 
TTAGAGTCTT TAGTTTAACA 
CTCTTCCTAA AATTAGGCAG 
CCTGACAGTA ACTTTCATGA 
TGCCTTTTTG CAAGACTTGT 
CAGTATTTCT AAGAATGGAA 
CAATTTATAG AGGTTAGGAA 
TTAGCTGTAT TTGTAGCAAT 
TGTAAATAAA ACACTCTTCC 
AGTAGAAATA ATCTGTTACT 
ATATTTATAA TTGTAGATTT 
ATTGTTTAGT TTAATGACGT 
GTATTGTGTT ACCTAAGTCA 
ATAGAAATAC CTTCATTTTG 
TCAAATGGTT TTTATCCAAG 
AAAAAAAAAA AAAAAAAAAA 
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AGACATAACA 
CACTGAGATA 
GATGTCACAG 
CTTCCCAACT 
CTCCACGGTC 
TAATAGTAGC 
AGTTATACCC 
TATTCTCATC 
ATCCCCTAGA 
AGCAATTCCA 
TACTGAAGAA 
CTTAGGTATT 
AAATATCGTT 
CAAACTGACT 
TATTGCTGCC 
ACATAATGTG 
TGAT CAGTAC 
GAGTGTGCAA 
AAAAAAGGGC 
GCAGTGGCCT 
GGCAGCCTAT 
TGGAAGAACA 
AACTGTCAAC 
AACTGAGGAG 
AACTGAGGTG 
AG CAGG C AAA 
GAGTGACTAT 
CATCCCTGTG 
CAT CAATGCC 
CCCTCTCCTT 
GGTGGTTATG 
TAAAGATGAG 
ATGTCTATCT 
TGATTATGTA 
CATTAGTAAA 
GCCTATGATT 
AACCCTTATG 
GATCAATCTG 
AGTGATCCTC 
TAATGGTGCA 
CAGAAAGGGG 
GAAAATCAGT 
CATAGGATTC 
AATTTACTTA 
TTGTGGTATT 
TTCCAAACTA 
TAT CAGGTTT 
ATATGATATT 
TATTGTAAAT 
TTATATTTTA 
AGTTCATTAG 
TTAACTTTGT 
AAAGAAGTTT 
GAATTGCAAA 
AAAAAAA 



GCACAGCCCG 
CGTGTTGATG 
GGTCCCTCAG 
GAGGTAACAC 
AACGTGGTAT 
CATGAGT CTC 
CTTGTGATCG 
TACTGGAGGA 
GTTATATCCA 
ATAAAGCACT 
TTTGAGACAC 
ACAGCAGACA 
GCCTATGATC 
GATTATATCA 
CAAGGCCCAC 
GAAGTTATTG 
TGGCCTGCCG 
GTGCTTGCCT 
TCCCAGAAAG 
GACATGGGAG 
GCCAAGCGCC 
GGCACATATA 
ATATTTGGCT 
CAATATGTCT 
CTGGACAGTC 
ACAAAGCTAG 
TCTGCAGCCC 
GAAAGATCAA 
TCCTATATCA 
CATACCATCA 
ATTCCTGATG 
CCTATAAATT 
AATGAGGAAA 
CTTGAAGTGA 
ACTTTTGAAC 
GTTCATGATG 
CACCAACTAG 
ATGAGGCCAG 
AGCCTTGTGA 
GCATTGCCTG 
TGGGGGGACT 
CTAGTTCTGT 
TGCCGCCAAA 
TTATGTTTGA 
TTTTTCTGTA 
CAGAAAATGT 
GCTAGAAATA 
CAACATTTTA 
ACTGCCCTAG 
CTACTGAGTC 
CTGGTCTTAC 
TTCAGCATGT 
TTATGAGAAT 
AATAAATATA 



ATGTTGGATC 
AATCTGAGAA 
TTACAGATCT 
CTCATGCTTT 
ACTCGCAGAC 
GTATTGGTCT 
TGTCAGCCCT 
AATGCTTCCA 
CACCTCCAAC 
TTCCAAAGCA 
TGAAAGAGTT 
GCTCCAACCA 
ATAGCAGGGT 
ATGCCAATTA 
TGAAATCCAC 
TCATGATAAC 
ATGGGAGTGA 
ATTATACTGT 
GAAGACCCAG 
TACCAGAGTA 
ATGCAGTGGG 
TTGTGCTAGA 
TCTTAAAACA 
TCATT CATGA 
ATATT CATGC 
AGAAACAATT 
TAAAGCAATG 
GGGTTGGCAT 
TGGGCTATTA 
AGGATTTCTG 
GCCAAAACAT 
GTGAGAGCTT 
AACTTATAAT 
GGCACTTTCA 
TTATAAGTGT 
AGCATGGAGG 
AAAAAGAAAA 
GAGTCTTTGC 
GCACAAGGCA 
ATGGAAATAT 
CACATCTGAG 
TATCTGTTGA 
TTTATATCAT 
ACTAAAATGA 
TTGATTTTAA 
TTGTTTTTAG 
TAACTTTTAA 
CAACTGCAGT 
TGTCTCCATG 
AAGTTTTCTA 
TCTACCAGTT 
AATTTTAACT 
AACACCTTAC 
AATATTGCCA 



AGGCAGAGAG 2160 

GACAACCAAG 2220 

GGAAATGCCA 2280 

TACCCCATCC 2340 

AACCCAACCG 2400 

AGCTGAGGGG 2460 

GACTTTTATC 2520 

GACTGCACAC 25 80 

ACCTATCTTT 2 640 

TGTTGCAGAT 2700 

TTACCAGGAA 2760 

CCCAGACAAC 282 0 

TAAGCTAGCA 2 880 

TGTTGATGGC 2 940 

AGCTGAAGAT 3 0 00 

AAACCTCGTG 3 060 

GGAGTACGGG 3120 

GAGGAATTTT 3180 

TGGACGTGTG 3240 

CTCCCTGCCA 3300 

GCCTGTTGTC 33 60 

CAGTATGTTG 3420 

CATCCGTTCA 3 480 

TACACTGGTT 3540 

CTATGTTAAT 360 0 

CCAGCTCCTG 3660 

CAACAGGGAA 3720 

TTCATCCCTG 3780 

CCAGAGCAAT 3840 

GAGGATGATA 3900 

GGCAGAAGAT 3960 

TAAGGTCACT 4020 

TCAGGACTTT 4080 

GTGTCCTAAA 4140 

T ATAAAAG AA 4200 

AGTGACGGCA 42 60 

TTCCGTGGAT 4320 

TGACATTGAG 4380 

GGAAGAGAAT 4440 

AGCTGAGAGC 450 0 

CATTGTTTTC 4560 

TTTCCCATCA 4620 

TAACAATGTG 4680 

TTGAATTTTA 4740 

CAGAAAATTT 4800 

TGTCAAATTT 48 60 

TACAGT AG CC 4920 

ATTCACCTAA 4 980 

GACCAAATTT 5040 

GTTCTGTGTA 5100 

TTCTGACATT 5160 

TTTGTGGAAA 5220 

CAAACATTGT 5280 

TTAAAAAAAA 5340 
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Seq ID NO: 575 Protein sequence: 
Protein Accession #: Eos sequence 



65 



70 



75 



80 



85 



MRILKRFLAC 
QSPINIDEDL 
FKASKITFHW 
ILFEVGTEEN 
TDTVDWIVFK 
TGKEEIHEAV 
HEFLTDGYQD 
LIGTEEIIKE 
RSPTRGSEFS 
GSKTVLRSPH 
ENISQGYIFS 
TAQPDVGSGR 
TEVTPHAFTP 
PLVIVSALTF 
PIKHFPKHVA 
VAYDHSRVKL 
VEVIVMITNL 
GSQKGRPSGR 
TGTYIVLDSM 
VLDSHIHAYV 
VERSRVGISS 
MIPDGQNMAE 
VLEVRHFQCP 
MHQLEKENSV 
AALPDGNIAE 



11 
I 

IQLLCVCRLD 
TQVNVNLKKL 
GKCNMSSDGS 
LDFKAI IDGV 
DTVSISESQL 
CSSEPENVQA 
LGAILNNLLP 
EEEGKD I EEG 
GKGDVPNTSL 
MNLSGTAESL 
SENPETITYD 
ESFLQTNYTE 
SSRQQDLVST 
ICLWLVGIL 
DLHASSGFTE 
AQLAEKDGKL 
VEKGRRKCDQ 
WTQYHYTQW 
LQQIQHEGTV 
NALLIPGPAG 
LSGEGTDYIN 
DEFVYWPNKD 
KWPNPDSPIS 
DVYQVAKMIN 
SLESLV 



21 

1 

WANGYYRQQR 
KFQGWDKTSL 
EHSLEGQKFP 
ESVSRFGKQA 
AVFCEVLTMQ 
DPENYTSLLV 
NMSYVLQIVA 
AIVNPGRDSA 
NSTSQPVTKL 
NTVSITEYEE 
VLIPESARNA 
IRVDESEKTT 
VNWYSQTTQ 
IYWRKCFQTA 
EFETLKEFYQ 
TDYINANYVD 
YWPADGSEEY 
PDMGVPEYSL 
NIFGFLKHIR 
KTKLEKQFQL 
ASYIMGYYQS 
EPINCESFKV 
KTFELISVIK 
LMRPGVFADI 



31 

1 

KLVEEIGWSY 
ENTF I HNTGK 
LEMQIYCFDA 
ALDPFILLNL 
QSGYVMLMDY 
TWERPRWYD 
ICTNGLYGKY 
TNQIRKKEPQ 
ATEKDISLTS 
ESLLTSFKLD 
SEDSTSSGSE 
KSPSAGPVMS 
PVYNAEASNS 
HFYLEDSTSP 
EVQSCTVDLG 
GYNRPKAYIA 
GNFLVTQKSV 
PVLTFVRKAA 
SQRNYLVQTE 
IiSQSNIQQSD 
NEFIITQHPL 
TLMAEEHKCL 
EEAANRDGPM 
EQYQFLYKVI 



41 
I 

TGALNQKNWG 
TVEINLTNDY 
DRFSSFEEAV 
LPNSTDKYYI 
LQNNFREQQY 
TMIEKFAVLY 
SDQLIVDMPT 
ISTTTHYNRI 
QTVTELPPHT 
TGAEDSSGSS 
ESLKDPSMEG 
QGPSVTDLEM 
SHESRIGLAE 
RVISTPPTPI 
ITADSSNHPD 
AQGPLKSTAE 
QVLAYYTVRN 
YAKRHAVGPV 
EQYVFIHDTL 
YSAALKQCNR 
LHTIKDFWRM 
SNEEKLIIQD 
IVHDEHGGVT 
LSLVSTRQEE 



51 

I 

KKYPTCNSPK 60 

RVSGGVSEMV 120 

KGKGKLRALS 180 

YNGSLTSPPC 240 

KFSRQVFSSY 300 

QQLDGEDQTK 360 

DNPELDLFPE 420 

GTKYNEAKTN 480 

VEGTSASLND 540 

PATSAIPFIS 600 

NVWFPSSTDI 660 

PHYSTFAYFP 720 

GLESEKKAVI 780 

FPISDDVGAI 840 

NKHKNRY IN I 900 

DFWRMIWEHN 960 

FTLRNTKIKK 1020 

WHCSAGVGR 10 80 

VEAILSKETE 1140 

EKNRTSSIIP 1200 

IWDHNAQLW 1260 

FILEATQDDY 1320 

AGTFCALTTL 1380 

NPSTSLDSNG 1440 
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Seq ID NO: 576 DNA sequence 

Nucleic Acid Accession #: EOS sequence 

Coding sequence: 148-4494 

•J 

1 11 21 31 41 51 

I I I I I I 

CACACATACG CACGCACGAT CTCACTTCGA TCTATACACT GGAGGATTAA AACAAACAAA 60 

CAAAAAAAAC ATTTCCTTCG CTCCCCCTCC CTCTCCACTC TGAGAAGCAG AGGAGCCGCA 12 0 

10 CGGCGAGGGG CCGCAGACCG TCTGGAAATG CGAATCCTAA AGCGTTTCCT CGCTTGCATT 180 

CAGCTCCTCT GTGTTTGCCG CCTGGATTGG GCTAATGGAT ACTACAGACA ACAGAGAAAA 240 

CTTGTTGAAG AGATTGGCTG GTCCTATACA GGAGCACTGA ATCAAAAAAA TTGGGGAAAG 300 

AAAT AT CCAA CATGTAATAG CCCAAAACAA TCTCCTATCA ATATTGATGA AGATCTTACA 3 60 

CAAGTAAATG TGAATCTTAA GAAACTTAAA TTTCAGGGTT GGGATAAAAC ATCATTGGAA 420 

15 AACACATT C A T T CAT AACAC TGGGAAAACA GTGGAAATTA ATCTCACTAA TGACTACCGT 480 

GTCAGCGGAG GAGTTTCAGA AATGGTGTTT AAAGCAAGCA AGATAACTTT T C ACTGGGG A 540 

AAATGCAATA TGTCATCTGA TGGATCAGAG CATAGTTTAG AAGGACAAAA ATTTCCACTT 60 0 

GAGATGCAAA TCTACTGCTT TGATGCAGAC CGATTTTCAA GTTTTGAGGA AGCAGTCAAA 660 

GGAAAAGGGA AGTTAAGAGC TTTATCCATT TTGTTTGAGG TTGGGACAGA AGAAAATTTG 720 

20 GATTTCAAAG CGATTATTGA TGGAGTCGAA AGTGTTAGTC GTTTTGGGAA GCAGGCTGCT 780 

TTAGATCCAT TCATACTGTT GAACCTTCTG CCAAACTCAA CTGACAAGTA TTACATTTAC 840 

AATGGCTCAT TGACATCTCC TCCCTGCACA GACACAGTTG ACTGGATTGT TTTTAAAGAT 90 0 

ACAGTTAGCA TCTCTGAAAG CCAGTTGGCT GTTTTTTGTG AAGTTCTTAC AATGCAACAA 960 

TCTGGTTATG TCATGCTGAT GGACTACTTA CAAAACAATT TT CGAGAGC A ACAGTACAAG 102 0 

25 TTCTCTAGAC AGGTGTTTTC CTCATACACT GGAAAGGAAG AGATTCATGA AGCAGTTTGT 10 80 

AGTTCAGAAC CAGAAAATGT TCAGGCTGAC CCAGAGAATT ATACCAGCCT T CTTGT T AC A 114 0 

TGGGAAAGAC CTCGAGTCGT TTATGATACC ATGATTGAGA AGTTTGCAGT TTTGTACCAG 12 0 0 

CAGTTGGATG GAGAGGACCA AACCAAGCAT GAATTTTTGA CAGATGGCTA TCAAGACTTG 1260 

GGTGCTATTC T CAATAAT TT GCTACCCAAT ATGAGTTATG TTCTTCAGAT AGTAGCCATA 132 0 

30 TGCACTAATG GCTTATATGG AAAATACAGC GACCAACTGA TTGTCGACAT GCCTACTGAT 1380 

AATCCTGAAC TTGATCTTTT CCCTGAATTA ATTGGAACTG AAGAAATAAT CAAGGAGGAG 1440 

GAAGAGGGAA AAGACATTGA AGAAGGCGCT ATTGTGAATC CTGGTAGAGA CAGTGCTACA 1500 

AACCAAATCA GGAAAAAGGA ACCCCAGATT TCTACCACAA CACACTACAA TCGCATAGGG 1560 

ACGAAATACA ATGAAGCCAA GACTAACCGA TCCCCAACAA GAGGAAGTGA ATTCTCTGGA 1620 

35 AAGGGTGATG TTCCCAATAC ATCTTTAAAT TCCACTTCCC AACCAGTCAC TAAATTAGCC 1680 

ACAGAAAAAG ATATTTCCTT GACTTCTCAG ACTGTGACTG AACTGCCACC TCACACTGTG 1740 

GAAGGTACTT CAGCCTCTTT AAATGATGGC TCTAAAACTG TTCTTAGATC TCCACATATG 1800 

AACTTGT CGG GGACTGCAGA ATCCTTAAAT ACAGTTTCTA TAACAGAATA TGAGGAGGAG 1860 

AGTTTATTGA CCAGTTTCAA GCTTGATACT GGAGCTGAAG ATTCTTCAGG CTCCAGTCCC 1920 

40 GCAACTTCTG CTATCCCATT CATCTCTGAG AACATATCCC AAGGGTATAT ATTTTCCTCC 1980 

GAAAACCCAG AGACAATAAC ATATGATGTC CTTATACCAG AATCTGCTAG AAATGCTTCC 2040 

GAAGATTCAA CTTCATCAGG TTCAGAAGAA TCACTAAAGG ATCCTTCTAT GGAGGGAAAT 2100 

GTGTGGTTTC CTAGCTCTAC AGACATAACA GCACAGCCCG ATGTTGGATC AGGCAGAGAG 2160 

AGCTTTCTCC AGACTAATTA CACTGAGATA CGTGTTGATG AATCTGAGAA GACAACCAAG 2220 

45 TCCTTTTCTG CAGGCCCAGT GATGTCACAG GGTCCCTCAG TTACAGATCT GGAAATGCCA 2280 

CATTATTCTA CCTTTGCCTA CTTCCCAACT GAGGTAACAC CTCATGCTTT TACCCCATCC 2340 

TCCAGACAAC AGGATTTGGT CTCCACGGTC AACGTGGTAT ACTCGCAGAC AACCCAACCG 2400 

GTATACAATG AGGCCAGTAA TAGTAGCCAT GAGTCTCGTA TTGGTCTAGC TGAGGGGTTG 2460 

GAATCCGAGA AGAAGGCAGT TATACCCCTT GTGATCGTGT CAGCCCTGAC TTTTATCTGT 252 0 

50 CTAGTGGTTC TTGTGGGTAT TCTCATCTAC TGGAGGAAAT GCTTCCAGAC TGCACACTTT 2580 

TACTTAGAGG ACAGT ACAT C CCCTAGAGTT ATATCCACAC CTCCAACACC TATCTTTCCA 2640 

ATTT CAGATG ATGTCGGAGC AATTCCAATA AAGCACTTTC CAAAGCATGT TGCAGATTTA 2700 

CATGCAAGTA GTGGGTTTAC TGAAGAATTT GAGGAAGTGC AGAGCTGTAC TGTTGACTTA 2760 

GGTATTACAG CAGACAGCTC CAACCACCCA GACAACAAGC ACAAGAATCG ATACATAAAT 2 82 0 

55 ATCGTTGCCT ATGATCATAG CAGGGTTAAG CTAGCACAGC TTGCTGAAAA GGATGGCAAA 2880 

CTGACTGATT ATATCAATGC CAAT TATGTT GATGGCTACA ACAGACCAAA AGCTTATATT 2940 

GCTGCCCAAG GCCCACTGAA ATCCACAGCT GAAGATTTCT GGAGAATGAT ATGGGAACAT 3000 

AATGTGGAAG TTATTGTCAT GATAACAAAC CTCGTGGAGA AAGGAAGGAG AAAATGTGAT 3060 

CAGTACTGGC CTGCCGATGG GAGTGAGGAG TACGGGAACT TT CTGGTCAC TCAGAAGAGT 3120 

60 GTGCAAGTGC TTGCCTATTA TACTGTGAGG AATTTTACTC TAAGAAACAC AAAAATAAAA 3180 

AAGGGCTCCC AGAAAGGAAG ACCCAGTGGA CGTGTGGTCA CACAGTATCA CTACACGCAG 324 0 

TGGCCTGACA TGGGAGTACC AGAGTACTCC CTGCCAGTGC TGACCTTTGT GAGAAAGGCA 3300 

GCCTATGCCA AGCGCCATGC AGTGGGGCCT GTTGTCGTCC ACTGCAGTGC TGGAGTTGGA 3360 

AGAACAGGCA CATATATTGT GCTAGACAGT ATGTTGCAGC AGATTCAACA CGAAGGAACT 3420 

65 GTCAACATAT TTGGCTTCTT AAAACACATC CGTTCACAAA GAAATTATTT GGTACAAACT 3480 

GAGGAGCAAT ATGTCTTCAT TCATGATACA CTGGTTGAGG CCATACTTAG TAAAGAAACT 3540 

GAGGTGCTGG ACAGTCATAT TCATGCCTAT GTTAATGCAC TCCTCATTCC TGGACCAGCA 3600 

GGCAAAACAA AGCTAGAGAA ACAATT CCAG CTCCTGAGCC AGTCAAATAT ACAGCAGAGT 3 660 

GACTATTCTG CAGCCCTAAA GCAATGCAAC AGGGAAAAGA ATCGAACTTC TTCTATCATC 3720 

70 CCTGTGGAAA GAT CAAGGGT TGGCATTTCA TCCCTGAGTG GAGAAGGCAC AGACTACATC 3 780 

AATGCCTCCT AT AT CATGGG CTATTACCAG AGCAATGAAT TCATCATTAC CCAGCACCCT 3840 

CTCCTTCATA CCATCAAGGA TTTCTGGAGG ATGATATGGG ACCATAATGC CCAACTGGTG 3 900 

GTTATGATTC CTGATGGCCA AAACATGGCA GAAGATGAAT TTGTTTACTG GCCAAATAAA 3 960 

GATGAGCCTA TAAATTGTGA GAGCTTTAAG GTCACTCTTA TGGCTGAAGA ACACAAATGT 402 0 

75 CTATCTAATG AGGAAAAACT TATAATTCAG GACTTTATCT TAGAAGCTAC ACAGGATGAT 4080 

TATGTACTTG AAGTGAGGCA CTTTCAGTGT CCTAAATGGC CAAATCCAGA TAGCCCCATT 4140 

AGTAAAACTT TTGAACTTAT AAGTGTTATA AAAGAAGAAG CTGCCAATAG GGATGGGCCT 4200 

ATGATTGTTC ATGATGAGCA TGGAGGAGTG ACGGCAGGAA CTTTCTGTGC TCTGACAACC 4260 

CTTATGCACC AACTAGAAAA AGAAAATTCC GTGGATGTTT ACCAGGTAGC CAAGATGATC 4320 

80 AATCTGATGA GGCCAGGAGT CTTTGCTGAC ATTGAGCAGT ATCAGTTTCT CTACAAAGTG 4380 

ATCCTCAGCC TTGTGAGCAC AAGG CAGGAA GAGAATCCAT CCACCTCTCT GGACAGTAAT 4440 

GGTGCAGCAT TGCCTGATGG AAATATAGCT GAGAGCTTAG AGTCTTTAGT TTAACACAGA 4500 

AAGGGGTGGG GGGACTCACA TCTGAGCATT GTTTTCCTCT TCCTAAAATT AGGCAGGAAA 4560 

ATCAGT CTAG TTCTGTTATC TGTTGATTTC CCATCACCTG ACAGTAACTT TCATGACATA 4620 

85 GGATTCTGCC GCCAAATTTA TATCATTAAC AATGTGTGCC TTTTTGCAAG ACTTGTAATT 4680 

TACTTATTAT GTTTGAACTA AAATGATTGA ATTTTACAGT ATTTCTAAGA ATGGAATTGT 4740 

GGTATTTTTT T CTGTATTGA TTTTAACAGA AAATTTCAAT TTATAGAGGT TAGGAATTCC 4800 
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AAACTACAGA AAATGTTTGT TTTTAGTGTC AAATTTTTAG CTGTATTTGT AGCAATT AT C 4 860 

AGGTTTGCTA GAAATATAAC TTTTAATACA GTAGCCTGTA AATAAAACAC TCTTCCATAT 492 0 

GATATTCAAC ATTTTACAAC TGCAGTATTC ACCTAAAGTA GAAATAATCT GTTACTTATT 4980 

GTAAATACTG CCCTAGTGTC TCCATGGACC AAATTTATAT TTATAATTGT AGATTTT TAT 5040 

ATTTTACTAC TGAGTCAAGT TTTCTAGTTC TGTGTAATTG TTTAGTTTAA TGACGTAGTT 5100 

CATTAGCTGG TCTTACTCTA CCAGTTTTCT GACATTGTAT TGTGTTACCT AAGTCATTAA 5160 

CTTTGTTTCA GCATGTAATT TTAACTTTTG TGGAAAATAG AAATACCTTC ATTTTGAAAG 522 0 

AAGTTTTTAT GAGAATAACA CCTTACCAAA CAT TGTTCAA ATGGTTTTTA TCCAAGGAAT 5280 

TGCAAAAATA AATATAAATA TTGCCATTAA AAAAAAAAAA AAAAAAAAAA AAAAAAAAAA 5340 
AAA 

Seq ID NO: 577 Protein sequence: 
Protein Accession #: EOS sequence 

1 11 21 31 41 51 

I I I I I I 

MRILKRFLAC IQLLCVCRLD WANGYYRQQR KLVEEIGWSY TGALNQKNWG KKYPTCNSPK 60 

QSPINIDEDL TQVNVNLKKL KFQGWDKTSL ENTFIHNTGK TVEINLTNDY RVSGGVSEMV 12 0 

FKASKITFHW GKCNMSSDGS EHSLEGQKFP LEMQIYCFDA DRFSSFEEAV KGKGKLRALS 180 

ILFEVGTEEN LDFKAIIDGV ESVSRFGKQA ALDPFILLNL LPNSTDKYYI YNGSLTSPPC 240 

TDTVDWIVFK DTVSISESQIi AVFCEVLTMQ QSGYVMLMDY LQNNFREQQY KFSRQVFSSY 300 

TGKEEIHEAV CSSEPENVQA DPENYTSLLV TWERPRWYD TMIEKFAVLY QQLDGEDQTK 360 

HEFLTDGYQD LGAILNNLLP NMSYVLQIVA ICTNGLYGKY SDQLIVDMPT DNPELDLFPE 420 

LIGTEEIIKE EEEGKDIEEG AIVNPGRDSA TNQIRKKEPQ ISTTTHYNRI GTKYNEAKTN 480 

RSPTRGSEFS GKGDVPNTSL NSTSQPVTKL ATEKDISLTS QTVTELPPHT VEGTSASLND 540 

GSKTVLRSPH MNLSGTAESL NTVSITEYEE ESLLTSFKLD TGAEDSSGSS PATSAIPFIS 600 

ENISQGYIFS SENPETITYD VLIPESARNA SEDSTSSGSE ESLKDPSMEG NVWFPSSTDI 660 

TAQPDVGSGR ESFLQTNYTE IRVDESEKTT KSFSAGPVMS QGPSVTDLEM PHYSTFAYFP 720 

TEVTPHAFTP SSRQQDLVST VNWYSQTTQ PVYNEASNSS HESRIGLAEG LESEKKAVIP 780 

LVIVSALTFI CLWLVGILI YWRKCFQTAH FYLEDSTSPR VISTPPTPIF PISDDVGAIP 840 

I KHFPKHVAD LHASSGFTEE FEEVQSCTVD LGITADSSNH PDNKHKNRY I N I VAYDHSRV 900 

KLAQLAEKDG KLTDYINANY VDGYNRPKAY IAAQGPLKST AEDFWRMIWE HNVEVIVMIT 960 

NLrVEKGRRKC DQYWPADGSE EYGNFLVTQK SVQVLAYYTV RNFTLRNTKI KKGSQKGRPS 102 0 

GRWTQYHYT QWPDMGVPEY SLPVLTFVRK AAYAKRHAVG PVWHCSAGV GRTGTYIVLD 1080 

SMhQQIQHEG TVNIFGFLKH IRSQRNYLVQ TEEQYVFIHD TLVEAILSKE TEVLDSHIHA 1140 

YVNALLIPGP AGKTKLEKQF QLLSQSNIQQ SDYSAALKQC NREKNRTSSI IPVERSRVGI 1200 

SSLSGEGTDY INASYIMGYY QSNEFIITQH PLUHTIKDFW RMIWDHNAQL WMIPDGQNM 1260 

AEDEFVYWPN KDEPINCESF KVTLMAEEHK CLSNEEKLII QDFILEATQD DYVLEVRHFQ 132 0 

CPKWPNPDSP ISKTFELISV I KEEAANRDG PMIVHDEHGG VTAGTFCALT TLMHQLEKEN 1380 

SVDVYQVAKM INLMRPGVFA DIEQYQFLYK VILSLVSTRQ EENPSTSLDS NGAALPDGNI 1440 
AESLESLV 



Seq ID NO: 578 DNA sequence 

Nucleic Acid Accession #: EOS sequence 

Coding sequence: 501-4514 

1 11 21 31 41 51 

! I I I 1 I 

CACACATACG CACGCACGAT CTCACTTCGA TCTATACACT GGAGGATTAA AACAAACAAA 60 

CAAAAAAAAC ATTTCCTTCG CTCCCCCTCC CTCTCCACTC TGAGAAGCAG AGGAGCCGCA 120 

CGGCGAGGGG CCGCAGACCG TCTGGAAATG CGAATCCTAA AGCGTTTCCT CGCTTGCATT 180 

CAGCTCCTCT GTGTTTG CCG CCTGGATTGG GCTAATGGAT ACTACAGACA ACAGAGAAAA 240 

CTTGTTGAAG AGATTGGCTG GTCCTATACA GGAGCACTGA ATCAAAAAAT TGGGGAAAGA 300 

AATATCCAAC ATGTAATAGC CCAAAACAAT CTCCTATCAA TATTGATGAA GATCTTACAC 360 

AAGTAAATGT GAATCTTAAG AAACTTAAAT TTCAGGGTTG GGATAAAACA TCATTGGAAA 420 

ACACATTCAT TCATAACACT GGGAAAACAG TGGAAATTAA TCTCACTAAT GACTACCGTG 480 

TCAGCGGAGG AGTTTCAGAA ATGGTGTTTA AAGCAAGCAA GATAACTTTT CACTGGGGAA 540 

AATGCAATAT GTCATCTGAT GGATCAGAGC ATAGTTTAGA AGGACAAAAA TTTCCACTTG 600 

AGATGCAAAT CTACTGCTTT GATGCGGACC GATTTTCAAG TTTTGAGGAA GCAGTCAAAG 660 

GAAAAGGGAA GTTAAGAGCT TTATCCATTT TGTTTGAGGT TGGGACAGAA GAAAATTTGG 720 

ATTTCAAAGC GATTATTGAT GGAGTCGAAA GTGTTAGTCG TTTTGGGAAG CAGGCTGCTT 780 

TAGATCCATT CATACTGTTG AACCTTCTGC CAAACTCAAC TGACAAGTAT TACATTTACA 840 

ATGGCTCATT GACATCTCCT CCCTGCACAG ACACAGTTGA CTGGATTGTT TTTAAAGATA 90 0 

CAGTTAGCAT CTCTGAAAGC CAGTTGGCTG TTTTTTGTGA AGTTCTTACA ATGCAACAAT 960 

CTGGTTATGT CATGCTGATG GACTACTTAC AAAACAATTT TCGAGAGCAA CAGTACAAGT 1020 

TCTCTAGACA GGTGTTTTCC TCATACACTG GAAAGGAAGA GATTCATGAA GCAGTTTGTA 1080 

GTTCAGAACC AGAAAATGTT CAGGCTGACC CAGAGAATTA TACCAGCCTT CTTGTTACAT 1140 

GGGAAAGACC TCGAGTCGTT TATGATACCA TGATTGAGAA GTTTGCAGTT TTGTACCAGC 1200 

AGTTGGATGG AGAGGACCAA ACCAAGCATG AATTTTTGAC AG ATGG CTAT CAAGACTTGG 1260 

GTGCTATTCT CAATAATTTG CTACCCAATA TGAGTTATGT TCTTCAGATA GTAGCCATAT 1320 

GCACTAATGG CTTATATGGA AAATACAGCG ACCAACTGAT TGTCGACATG CCTACTGATA 13 80 

ATCCTGAACT TGATCTTTTC CCTGAATTAA TTGGAACTGA AGAAATAATC AAGGAGGAGG 1440 

AAGAGGGAAA AGACATTGAA GAAGGCGCTA TTGTGAATCC TGGTAGAGAC AGTGCTACAA 1500 

ACCAAATCAG GAAAAAGGAA CCCCAGATTT CTACCACAAC ACACTACAAT CGCATAGGGA 1560 

CGAAATACAA TGAAGCCAAG ACTAACCGAT CCCCAACAAG AGGAAGTGAA TTCTCTGGAA 1620 

AGGGTGATGT TCCCAATACA TCTTTAAATT CCACTTCCCA ACCAGTCACT AAATTAGCCA 1680 

CAGAAAAAGA TATTTCCTTG ACTTCTCAGA CTGTG ACT G A ACTGCCACCT CACACTGTGG 1740 

AAGGTACTTC AGCCTCTTTA AATGATGGCT CTAAAACTGT TCTTAGATCT CCACATATGA 1800 

ACTTGTCGGG GACTGCAGAA TCCTTAAATA CAGTTT CTAT AACAGAATAT GAGGAGGAGA 1860 

GTTTATTGAC CAGTTTCAAG CTTGATACTG GAGCTGAAGA TTCTT CAGGC TCCAGTCCCG 1920 

CAACTTCTGC TATCCCATTC ATCTCTGAGA ACATATCCCA AGGGTATATA TTTTCCTCCG 1980 

AAAACCCAGA GACAATAACA TATGATGT CC TTATACCAGA AT CTGCTAGA AATGCTTCCG 2040 

AAGATTCAAC TTCATCAGGT TCAGAAGAAT CACTAAAGGA TCCTTCTATG GAGGGAAATG 2100 

TGTGGTTTCC TAGCTCTACA GACATAACAG CACAGCCCGA TGTTGG AT CA GGCAGAGAGA 2160 

GCTTTCTCCA GACTAATTAC ACTGAGATAC GTGTTGATGA ATCTGAGAAG ACAACCAAGT 2220 

CCTTTTCTGC AGGCCCAGTG ATGTCACAGG GTCCCTCAGT TACAGATCTG GAAATGCCAC 22 80 
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ATTATTCTAC CTTTGCCTAC 
CCAGACAACA GGATTTGGTC 
TATACAATGA GGCCAGTAAT 
AATCCGAGAA GAAGGCAGTT 
TAGTGGTTCT TGTGGGTATT 
ACTTAGAGGA CAGTACATCC 
TTT CAGATG A TGTCGGAGCA 
ATGCAAGTAG TGGGTTTACT 
AGAGCTGTAC TGTTGACTTA 
ACAAGAATCG ATACATAAAT 
TTGCTGAAAA GGATGGCAAA 
ACAGACCAAA AGCTT AT AT T 
GGAGAATGAT ATGGGAACAT 
AAGGAAGGAG AAAATGTGAT 
TTCTGGTCAC TCAGAAGAGT 
TAAGAAACAC AAAAATAAAA 
CACAGT AT CA CTACACGCAG 
TGACCTTTGT GAGAAAGGCA 
ACTGCAGTGC TGGAGTTGGA 
AGATTCAACA CGAAGGAACT 
GAAATTATTT GGTACAAACT 
CCATACTTAG TAAAGAAACT 
TCCTCATTCC TGGACCAGCA 
AGTCAAATAT ACAGCAGAGT 
ATCGAACTTC TTCTATCATC 
GAGAAGGCAC AGACTACATC 
- TCATCATTAC CCAGCACCCT 
ACCATAATGC CCAACTGGTG 
TTGTTTACTG GCCAAATAAA 
TGGCTGAAGA ACACAAATGT 
TAGAAGCTAC ACAGGATGAT 
CAAATCCAGA TAGCCCCATT 
CTGCCAATAG GGATGGGCCT 
CTTTCTGTGC TCTGACAACC 
ACCAGGTAGC CAAGATGATC 
ATCAGTTTCT CTACAAAGTG 
CCACCTCTCT GGACAGTAAT 
AGTCTTTAGT TTAACACAGA 
TCCTAAAATT AGGCAGGAAA 
ACAGTAACTT TCATGACATA 
TTTTTGCAAG ACTTGTAATT 
ATTTCTAAGA ATGGAATTGT 
TTATAGAGGT TAGGAATTCC 
CTGTATTTGT AGCAATT AT C 
AATAAAACAC TCTTCCATAT 
GAAATAATCT GTTACTTATT 
TTATAATTGT AGATTTTTAT 
TTTAGTTTAA TGACGTAGTT 
TGTGTTACCT AAGTCATTAA 
AAATACCTTC ATTTTGAAAG 
ATGGTTTTTA T CCAAGGAAT 
AAAAAAAAAA AAAAAAAAAA 
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TTCCCAACTG 
TCCACGGTCA 
AGTAGCCATG 
ATACCCCTTG 
CTCATCTACT 
CCTAGAGTTA 
ATTCCAATAA 
GAAGAATTTG 
GGTATTACAG 
ATCGTTGCCT 
CTGACTGATT 
GCTGCCCAAG 
AATGTGGAAG 
CAGTACTGGC 
GTGCAAGTGC 
AAGGGCTCCC 
TGGCCTGACA 
GCCTATGCCA 
AGAACAGGCA 
GTCAACATAT 
GAGGAGCAAT 
GAGGTGCTGG 
GGCAAAACAA 
GACTATTCTG 
CCTGTGGAAA 
AATGCCTCCT 
CTCCTTCATA 
GTTATGATTC 
GATGAGCCTA 
CTATCTAATG 
TATGTACTTG 
AGTAAAACTT 
ATGATTGTTC 
CTTATGCACC 
AATCTGATGA 
ATCCTCAGCC 
GGTGCAGCAT 
AAGGGGTGGG 
ATCAGTCTAG 
GGATTCTGCC 
TACTTATTAT 
GGTATTTTTT 
AAACTACAGA 
AGGTTTGCTA 
GATATTCAAC 
GTAAATACTG 
ATTTTACTAC 
CATTAGCTGG 
CTTTGTTTCA 
AAGTTTTTAT 
TGCAAAAATA 
AAA 



AGGTAACACC 
ACGTGGTATA 
AGT CTCGTAT 
TGATCGTGTC 
GGAGGAAATG 
TATCCACACC 
AGCACTTTCC 
AGACACTGAA 
CAGACAGCTC 
ATGATCATAG 
ATATCAATGC 
GCCCACTGAA 
TTATTGTCAT 
CTGCCGATGG 
TTGCCTATTA 
AGAAAGGAAG 
TGGGAGTACC 
AGCGCCATGC 
CATATATTGT 
TTGGCTTCTT 
ATGTCTTCAT 
ACAGTCATAT 
AGCTAGAGAA 
CAGCCCTAAA 
GAT CAAGGGT 
ATATCATGGG 
CCAT CAAGGA 
CTGATGGCCA 
TAAATTGTGA 
AGGAAAAACT 
AAGTGAGGCA 
TTGAACTTAT 
ATGATGAGCA 
AACTAGAAAA 
GGCCAGGAGT 
TTGTGAGCAC 
TGCCTGATGG 
GGGACT CACA 
TTCTGTTATC 
GCCAAATTTA 
GTTTGAACTA 
TCTGTATTGA 
AAATGTTTGT 
GAAATATAAC 
ATTTTACAAC 
CCCTAGTGTC 
TGAGTCAAGT 
TCTTACTCTA 
GCATGTAATT 
GAGAATAACA 
AATATAAATA 



TCATGCTTTT 
CTCGCAGACA 
TGGTCTAGCT 
AGCCCTGACT 
CTTCCAGACT 
TCCAACACCT 
AAAGCATGTT 
AGAGT TTTAC 
CAACCACCCA 
CAGGGTTAAG 
CAATTATGTT 
ATCCACAGCT 
GATAACAAAC 
GAGTGAGGAG 
TACTGTGAGG 
ACCCAGTGGA 
AGAGTACTCC 
AGTGGGGCCT 
GCTAGACAGT 
AAAACACATC 
TCATGATACA 
TCATGCCTAT 
ACAATT CCAG 
GCAATGCAAC 
TGGCATTTCA 
CTATTACCAG 
TTTCTGGAGG 
AAACATGGCA 
GAGCTTTAAG 
TATAATTCAG 
CTTTCAGTGT 
AAGTGTTATA 
TGGAGGAGTG 
AGAAAATTCC 
CTTTGCTGAC 
AAGGCAGGAA 
AAATATAGCT 
TCTGAGCATT 
TGTTGATTTC 
TATCATTAAC 
AAATGATTGA 
TTTTAACAGA 
TTTTAGTGTC 
TTTTAATACA 
TGCAGTATTC 
TCCATGGACC 
TTTCTAGTTC 
CCAGTTTTCT 
TTAACTTTTG 
CCTTACCAAA 
TTGCCATTAA 



ACCCCATCCT 2340 

ACCCAACCGG 2400 

GAGGGGTTGG 2460 

TTTATCTGTC 252 0 

GCACACTTTT 2580 

ATCTTTCCAA 2640 

GCAGATTTAC 2 700 

CAGGAAGTGC 2760 

GACAACAAGC 282 0 

CTAGCACAGC 2 880 

GATGGCTACA 2940 

GAAGATTTCT 3000 

CTCGTGGAGA 3060 

TACGGGAACT 3120 

AATTTTACTC 3180 

CGTGTGGTCA 3240 

CTGCCAGTGC 3300 

GTTGTCGTCC 3360 

ATGTTGCAGC 3 420 

CGTTCACAAA 3480 

CTGGTTGAGG 3540 

GTTAATGCAC 3 60 0 

CTCCTGAGCC 3 660 

AGGGAAAAGA 372 0 

TCCCTGAGTG 3780 

AGCAATGAAT 3840 

ATGATATGGG 3900 

GAAGATGAAT 3960 

GTCACTCTTA 4020 

GACTTTATCT 4080 

CCTAAATGGC 4140 

AAAGAAGAAG 4200 

ACGGCAGGAA 4260 

GTGGATGTTT 4320 

ATTGAGCAGT 4380 

GAGAATCCAT 4440 

GAGAGCTTAG 4500 

GTTTTCCTCT 4560 

CCATCACCTG 4620 

AATGTGTGCC 4680 

ATTTTACAGT 4740 

AAATTTCAAT 4800 

AAATTTTTAG 4860 

GTAGCCTGTA 4 920 

ACCTAAAGTA 4 980 

AAATTTATAT 5040 

TGTGTAATTG 5100 

GACATTGTAT 5160 

TGGAAAATAG 5220 

CATTGTTCAA 52 80 

AAAAAAAAAA 5340 



Seq ID NO: 57 9 Protein sequence: 
55 Protein Accession #: EOS sequence 
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MVFKASKITF 
LSILFEVGTE 
PCTDTVDWIV 
SYTGKEEIHE 
TKHEFLTDGY 
PELIGTEEII 
TNRSPTRGSE 
NDGSKTVLRS 
ISENISQGYI 
DITAQPDVGS 
FPTEVTPHAF 
IPLVIVSALT 
IPIKHFPKHV 
IVAYDHSRVK 
NVEVIVMITN 
KGSQKGRPSG 
RTGTYIVLDS 
EVLDSHIHAY 
PVERSRVGIS 
VMIPDGQNMA 
YVLE VRHFQ C 
LMHQLEKENS 
GAALPDGN I A 



HWGKCNMSSD 

ENLDFKAIID 

FKDTVSISES 

AVCSSEPENV 

QDLGAILNNL 

KEEEEGKDIE 

FSGKGDVPNT 

PHMNLSGTAE 

FSSENPETIT 

GRESFLQTNY 

TPSSRQQDLV 

FICLWLVGI 

ADLHASSGFT 

LAQLAEKDGK 

LVE KGRRKCD 

RWTQYHYTQ 

MLQQIQHEGT 

VNALLIPGPA 

SLSGEGTDYI 

EDEFVYWPNK* 

PKWPNPDSPI 

VDVYQ VAKM I 

ESLESLV 



21 
I 

GSEHSLEGQK 
GVESVSRFGK 
QLAVFCEVLT 
QADPENYTSL 
LPNMSYVLQI 
EGAIVNPGRD 
SLNSTSQPVT 
SLNTVSITEY 
YDVLIPESAR 
TEIRVDESEK 
STVNWYSQT 
LIYWRKCFQT 
EEFETLKEFY 
LTDYINANYV 
QYWPADGSEE 
WPDMGVPEYS 
VNIFGFLKHI 
GKTKLEKQFQ 
NASYIMGYYQ 
DEPINCESFK 
SKTFELISVI 
NLMRPGVFAD 



31 
I 

FPLEMQIYCF 
QAALDPFILL 
MQQSGYVMLM 
LVTWERPRW 
VAI CTNGLYG 
SATNQIRKKE 
KLATEKD I Sh 
EEESLLTSFK 
NASEDSTSSG 
TTKSFSAGPV 
TQPVYNEASN 
AHFYLEDSTS 
QEVQSCTVDL 
D GYNRPKAY I 
YGNFLVTQKS 
LPVLTFVRKA 
RSQRNYLVQT 
LLSQSNIQQS 
SNEFIITQHP 
VTLMAEEHKC 
KEEAANRDGP 
IEQYQFLYKV 



41 



DADRFSSFEE 
NLLPNSTDKY 
DYLQNNFREQ 
YDTMIEKFAV 
KYSDQLIVDM 
PQISTTTHYN 
TSQTVTELPP 
LDTGAEDSSG 
SEESLKDPSM 
MSQGPSVTDL 
SSHESRIGLA 
PRVISTPPTP 
GITADSSNHP 
AAQGPLKSTA 
VQVLAYYTVR 
AYAKRHAVGP 
EEQYVFIHDT 
DYSAALKQCN 
LLHTIKDFWR 
LSNEEKLIIQ 
MIVHDEHGGV 
ILSLVSTRQE 



51 
I 

AVKGKGKLRA 60 

YIYNGSLTSP 120 

QYKFSRQVFS 180 

LYQQLDGEDQ 240 

PTDNPELDLF 300 

R I GTKYNEAK 360 

HTVEGTSASL 420 

SSPATSAIPF 480 

EGNVWFPSST 540 

EMPHYSTFAY 600 

EGLESEKKAV 660 

IFPISDDVGA 720 

DNKHKNRYIN 780 

EDFWRMIWEH 840 

NFTLRNTKIK 900 

VWHCSAGVG 960 

LVEAILSKET 1020 

REKNRTSSII 1080 

MIWDHNAQLV 1140 

DFILEATQDD 1200 

TAGTFCALTT 1260 

ENPSTSLDSN 1320 



85 



Seq ID NO: 580 DNA sequence 
Nucleic Acid Accession #: EOS 
Coding sequence: 148-4632 
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WO 02/086443 

1 I 

CACACATACG CACGCACGAT 
CAAAAAAAAC ATTTCCTTCG 
CGGCGAGGGG CCGCAGACCG 
CAGCTCCTCT GTGTTTGCCG 
CTTGTTGAAG AGATTGGCTG 
AAATATCCAA CATGTAATAG 
CAAGTAAATG TGAATCTTAA 
AACACATT CA TT CAT AACAC 
GTCAGCGGAG GAGTTTCAGA 
AAATGCAATA TGTCATCTGA 
GAGATGCAAA TCTACTGCTT 
GGAAAAGGGA AGTTAAGAGC 
GATTTCAAAG CGATTATTGA 
TTAGATCCAT TCATACTGTT 
AATGGCT CAT TGACATCTCC 
ACAGTTAGCA TCTCTGAAAG 
TCTGGTTATG TCATGCTGAT 
TTCTCTAGAC AGGTGTTTTC 
AGTTCAGAAC CAGAAAATGT 
TGGGAAAGAC CTCGAGTCGT 
CAGTTGGATG GAGAGGACCA 
GGTGCTATTC TCAATAAT TT 
TGCACTAATG GCTTATATGG 
AATCCTGAAC TTGATCTTTT 
GAAGAGGGAA AAGACATTGA 
AACCAAATCA GGAAAAAGGA 
ACGAAATACA ATGAAGCCAA 
AAGGGTGATG TTCCCAATAC 
ACAGAAAAAG ATATTTCCTT 
GAAGGTACTT CAGCCTCTTT 
AACTTGTCGG GGACTGCAGA 
AGTTTATTGA CCAGTTTCAA 
GCAACTTCTG CTATCCCATT 
GAAAACCCAG AGACAATAAC 
GAAGATT CAA CTTCATCAGG 
GTGTGGTTTC CTAGCTCTAC 
AGCTTTCTCC AGACTAATTA 
TCCTTTTCTG CAGGCCCAGT 
CATTATTCTA CCTTTGCCTA 
TCCAGACAAC AGGATTTGGT 
GTATACAATG AGGCCAGTAA 
GAATCCGAGA AGAAGGCAGT 
CTAGTGGTTC TTGTGGGTAT 
TACTTAGAGG ACAGTACATC 
ATTTCAGATG ATGTCGGAGC 
CATGCAAGTA GTGGGTTTAC 
CAGAGCTGTA CTGTTGACTT 
CACAAGAATC GATACATAAA 
CTTGCTGAAA AGGATGGCAA 
AACAGACCAA AAGCTTATAT 
TGGAGAATGA TATGGGAACA 
AAAGGAAGGA GAAAATGTGA 
TTTCTGGTCA CTCAGAAGAG 
CTAAGAAACA CAAAAATAAA 
ACACAGT AT C ACTACACGCA 
CTGACCTTTG TGAGAAAGGC 
CACTGCAGTG CTGGAGTTGG 
CAGATTCAAC ACGAAGGAAC 
AGAAATTATT TGGTACAAAC 
GCCATACTTA GTAAAGAAAC 
CTCCTCATTC CTGGACCAGC 
CTGTCACCCA GGCTGGAGTG 
GGCTTAACTG ATCCTCCTAC 
TCAAATATAC AGCAGAGTGA 
CGAACTTCTT CTATCATCCC 
GAAGG CACAG ACTACAT CAA 
ATCATTACCC AGCACCCTCT 
CATAATGCCC AACTGGTGGT 
GTTTACTGGC CAAATAAAGA 
GCTGAAGAAC ACAAATGTCT 
GAAGCTACAC AGGATGATTA 
AATCCAGATA GCCCCATTAG 
GCCAATAGGG ATGGGCCTAT 
TTCTGTGCTC TGACAACCCT 
CAGGTAGCCA AGATGATCAA 
CAGTTTCTCT ACAAAGTGAT 
ACCTCTCTGG ACAGTAATGG 
TCTTTAGTTT AACACAGAAA 
CTAAAATTAG GCAGGAAAAT 
AGTAACTTTC ATGACATAGG 
TTTGCAAGAC TTGTAATTTA 
TT CTAAGAAT GGAATTGTGG 
ATAGAGGTTA GGAATT CCAA 
GTATTTGTAG CAATTAT CAG 
TAAAACACTC TT CCATATGA 
AATAATCTGT TACTTATTGT 
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I 

CTCACTTCGA 
CTCCCCCTCC 
TCTGGAAATG 
CCTGGATTGG 
GTCCTATACA 
CCCAAAACAA 
GAAACTTAAA 
TGGGAAAACA 
AATGGTGTTT 
TGGATCAGAG 
TGATGCGGAC 
TTTATCCATT 
TGGAGTCGAA 
GAACCTTCTG 
TCCCTGCACA 
CCAGTTGGCT 
GGACTACTTA 
CTCATACACT 
TCAGGCTGAC 
TTATGATACC 
AACCAAGCAT 
GCTACCCAAT 
AAAAT AC AG C 
CCCTGAATTA 
AGAAGGCGCT 
ACCCCAGATT 
GACTAACCGA 
ATCTTTAAAT 
GACTTCTCAG 
AAATGATGGC 
ATCCTTAAAT 
GCTTGATACT 
CATCTCTGAG 
ATATGATGTC 
TTCAGAAGAA 
AGACATAACA 
CACTGAGATA 
G ATGT CACAG 
CTTCCCAACT 
CTCCACGGTC 
TAGTAGCCAT 
TATACCCCTT 
TCTCATCTAC 
CCCTAGAGTT 
AATTCCAATA 
TGAAGAATTT 
AGGTATTACA 
TATCGTTGCC 
ACTGACTGAT 
TGCTGCCCAA 
TAATGTGGAA 
TCAGTACTGG 
TGTGCAAGTG 
AAAGGGCTCC 
GTGGCCTGAC 
AGCCTATGCC 
AAGAACAGGC 
TGTCAACATA 
TGAGGAGCAA 
TGAGGTGCTG 
AGGCAAAACA 
CAGAGGCACA 
CTCAGCCTCC 
CTATTCTGCA 
TGTGGAAAGA 
TGCCTCCTAT 
CCTTCATACC 
TATGATTCCT 
TGAGCCTATA 
ATCTAATGAG 
TGTACTTGAA 
TAAAACTTTT 
GATTGTTCAT 
TATGCACCAA 
TCTGATGAGG 
CCTCAGCCTT 
TGCAGCATTG 
GGGGTGGGGG 
CAGTCTAGTT 
ATTCTGCCGC 
CTTATTATGT 
TATTTTTTTC 
ACTACAGAAA 
GTTTGCTAGA 
TATTCAACAT 
AAATACTGCC 



TCTATACACT 

CTCTCCACTC 

CGAATCCTAA 

GCTAATGGAT 

GG AG CACTG A 

TCTCCTATCA 

TTTCAGGGTT 

GTGGAAATTA 

AAAGCAAGCA 

CATAGTTTAG 

CGATTTTCAA 

TTGTTTGAGG 

AGTGTTAGTC 

CCAAACTCAA 

GACACAGTTG 

GTTTTTTGTG 

CAAAACAATT 

GGAAAGGAAG 

CCAGAGAATT 

ATGATTGAGA 

GAATTTTTGA 

ATGAGTTATG 

GACCAACTGA 

ATTGGAACTG 

ATTGTGAATC 

TCTACCACAA 

TCCCCAACAA 

TCCACTTCCC 

ACTGTGACTG 

TCTAAAACTG 

ACAGTTTCTA 

GGAGCTGAAG 

AACATATCCC 

CTTATACCAG 

TCACTAAAGG 

GCACAGCCCG 

CGTGTTGATG 

GGTCCCTCAG 

GAGGTAACAC 

AACGTGGTAT 

GAGTCTCGTA 

GTGATCGTGT 

TGGAGGAAAT 

ATATCCACAC 

AAGCACTTTC 

GAGACACTGA 

GCAGACAGCT 

TATGATCATA 

TATATCAATG 

GGCCCACTGA 

GTTATTGTCA 

CCTGCCGATG 

CTTGCCTATT 

CAGAAAGGAA 

ATGGGAGTAC 

AAGCGCCATG 

ACATATATTG 

TTTGGCTTCT 

TATGTCTTCA 

GACAGTCATA 

AAGCTAGAGA 

ATCTCGGCTC 

CGAGTGGCTG 

GCCCTAAAGC 

TCAAGGGTTG 

ATCATGGGCT 

ATCAAGGATT 

GATGGCCAAA 

AATTGTGAGA 

GAAAAACTTA 

GTGAGGCACT 

GAACTTATAA 

GATGAGCATG 

CTAGAAAAAG 

CCAGGAGTCT 

GTGGGCACAA 

CCTGATGGAA 

GACTCACATC 

CTGTTATCTG 

CAAATTTATA 

TTGAACTAAA 

TGTATTGATT 

ATGTTTGTTT 

AATATAACTT 

TTTACAACTG 

CTAGTGTCTC 



GGAGGATTAA 
TGAGAAGCAG 
AACGTTTCCT 
ACTACAGACA 
ATCAAAAAAA 
ATATTGATGA 
GGGATAAAAC 
ATCTCACTAA 
AGATAACTTT 
AAGGACAAAA 
GTTTTGAGGA 
TTGGGACAGA 
GTTTTGGGAA 
CTGACAAGTA 
ACTGGATTGT 
AAGTTCTTAC 
TT CGAGAGCA 
AGATTCATGA 
ATACCAG CCT 
AGTTTGCAGT 
CAGATGGCTA 
TTCTTCAGAT 
TTGTCGACAT 
AAGAAATAAT 
CTGGTAGAGA 
CACACTACAA 
GAGGAAGTGA 
AACCAGTCAC 
AACTGCCACC 
TTCTTAGATC 
TAACAGAATA 
ATTCTTCAGG 
AAGGGTATAT 
AATCTGCTAG 
ATCCTTCTAT 
ATGTTGGATC 
AATCTGAGAA 
TTACAGATCT 
CTCATGCTTT 
ACTCGCAGAC 
TTGGTCTAGC 
CAGCCCTGAC 
GCTTCCAGAC 
CTCCAACACC 
CAAAGCATGT 
AAGAGTTTTA 
CCAACCACCC 
GCAGGGTTAA 
CCAATTATGT 
AATCCACAGC 
TGATAACAAA 
GGAGTGAGGA 
ATACTGTGAG 
GACCCAGTGG 
CAGAGTACTC 
CAGTGGGGCC 
TGCTAGACAG 
TAAAACACAT 
TTCATGATAC 
TTCATGCCTA 
AACAATTCCA 
ACTGCAACCT 
GGACTATACT 
AATGCAACAG 
GCATTTCATC 
ATTACCAGAG 
TCTGGAGGAT 
ACATGGCAGA 
GCTTTAAGGT 
TAATTCAGGA 
TTCAGTGTCC 
GTGTTATAAA 
GAGGAGTGAC 
AAAATTCCGT 
TTGCTGACAT 
GGCAGGAAGA 
ATATAGCTGA 
TGAGCATTGT 
TTGATTTCCC 
TCATTAACAA 
ATGATTGAAT 
TTAACAGAAA 
TTAGTGTCAA 
TTAATACAGT 
CAGTATTCAC 
CATGGACCAA 



AACAAACAAA 60 

AGGAGCCGCA 120 

CGCTTGCATT 180 

ACAGAGAAAA 240 

TTGGGGAAAG 300 

AGATCTTACA 3 60 

AT CATTGGAA 420 

TGACTACCGT 480 

T CACTGGGG A 540 

ATTTCCACTT 600 

AGCAGTCAAA 660 

AGAAAATTTG 720 

GCAGGCTGCT 780 

TTACATTTAC 840 

TTTTAAAGAT 900 

AATGCAACAA 960 

ACAGTACAAG 1020 

AGCAGTTTGT 1080 

TCTTGTTACA 1140 

TTTGTACCAG 1200 

TCAAGACTTG 12 60 

AGTAGCCATA 1320 

GCCTACTGAT 13 80 

CAAGGAGGAG 1440 

CAGTGCTACA 150 0 

TCGCATAGGG 1560 

ATTCTCTGGA 1620 

TAAATTAGCC 1680 

TCACACTGTG 1740 

TCCACATATG 1800 

TGAGGAGGAG 1860 

CTCCAGTCCC 1920 

ATTTTCCTCC 1980 

AAATGCTTCC 2040 

GGAGGGAAAT 2100 

AGGCAGAGAG 2160 

GACAACCAAG 2220 

GGAAATGCCA 22 80 

TACCCCATCC 2340 

AACCCAACCG 2400 

TGAGGGGTTG 2460 

TTTTATCTGT 2520 

TGCACACTTT 2580 

TATCTTTCCA 2640 

TGCAGATTTA 2700 

CCAGGAAGTG 2760 

AGACAACAAG 2 820 

GCTAGCACAG 2 880 

TGATGGCTAC 2940 

TGAAGATTTC 3000 

CCTCGTGGAG 3 060 

GTACGGGAAC 3120 

GAATTTTACT 3180 

ACGTGTGGTC 3240 

CCTGCCAGTG 3300 

TGTTGTCGTC 3360 

TATGTTGCAG 3420 

CCGTTCACAA 3 480 

ACTGGTTGAG 3 540 

TGTTAATGCA 3600 

GGGTCTCACT 3660 

TCCTCTCCCT 372 0 

CCTGAGCCAG 3780 

GGAAAAG AAT 3840 

CCTGAGTGGA 3900 

CAATGAATTC 3 960 

GATATGGGAC 4020 

AGATGAATTT 40 80 

CACTCTTATG 4140 

CTTTATCTTA 4200 

TAAATGGCCA 4260 

AGAAGAAGCT 4320 

GGCAGGAACT 4380 

GGATGTTTAC 4440 

TG AG CAGT AT 4500 

GAAT CCATCC 4560 

GAGCTTAGAG 4620 

TTTCCTCTTC 4680 

ATCACCTGAC 4 740 

TGTGTGCCTT 4800 

TT TACAGT AT 4860 

ATTTCAATTT 4 920 

ATTTTTAGCT 4 980 

AGCCTGTAAA 5040 

CTAAAGTAGA 5100 

ATTTATATTT 5160 
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ATAATTGTAG ATTTTTATAT 
TAGTTTAATG ACGTAGTTCA 
TGTTACCTAA GTCATTAACT 
ATACCTTCAT TTTGAAAGAA 
GGTTTTTATC CAAGGAATTG 
AAAAAAAAAA AAAAAAAAAA 



TTTACTACTG 
TTAGCTGGTC 
TTGTTTCAGC 
GTTTTTATGA 
CAAAAATAAA 
A 



AGTCAAGTTT 
TTACTCTACC 
ATGTAATTTT 
GAATAACACC 
TATAAATATT 



Seq ID NO: 581 Protein sequence: 
Protein Accession # : EOS sequence 



11 



21 



MRILKRFLAC 
QSPINIDEDL 
FKASKITFHW 
ILFEVGTEEN 
TDTVDWIVFK 
TGKEEIHEAV 
HEFLTDGYQD 
LIGTEEIIKE 
RSPTRGSEFS 
GSKTVLRSPH 
ENISQGYIFS 
TAQPDVGSGR 
TEVTPHAFTP 
LVIVSALTF1 
IKHFPKHVAD 
AYDHSRVKLA 
EVIVMITNLV 
SQKGRPSGRV 
GTYIVLDSML 
LDSHIHAYVN 
SRVAGTILLS 
YIMGYYQSNE 
INCESFKVTL 
FELISVIKEE 
RPGVFADIEQ 



IQLLCVCRLD 
TQVNVNLKKL 
GKCNMSSDGS 
LDFKAI idgv 
DTVSISESQL 
CSSEPENVQA 
LGAILNNLLP 
EEEGKDIEEG 
GKGDVPNTSL 
MNLSGTAESL 
SENPETITYD 
ESFLQTNYTE 
SSRQQDLVST 
CLWLVGILI 
LHASSGFTEE 
QLAEKDGKLT 
EKGRRKCDQY 
VTQYHYTQWP 
QQIQHEGTVN 
ALLIPGPAGK 
QSNIQQSDYS 
FIITQHPLLH 
MAEEHKCLSN 
AANRDGPMIV 
YQFLYKVILS 



WANGYYRQQR 
KFQGWDKTSL 
EHSLEGQKFP 
ESVSRFGKQA 
AVFCEVLTMQ 
DPENYTSLLV 
NMSYVLQIVA 
AIVNPGRDSA 
NSTSQPVTKL 
NTVSITEYEE 
VLIPESARNA 
IRVDESEKTT 
VNWYSQTTQ 
YWRKCFQTAH 
FETLKEFYQE 
DYINANYVDG 
WPADGSEEYG 
DMGVPEYSLP 
IFGFLKHIRS 
TKLEKQFQGL 
AALKQCNREK 
TIKDFWRMIW 
EEKLIIQDFI 
HDEHGGVTAG 
LVGTRQEENP 



31 
I 

KLVEEIGWSY 
ENTFIHNTGK 
LEMQIYCFDA 
AIiDPFILLNL 
QSGYVMLMDY 
TWERPRWYD 
ICTNGLYGKY 
TNQIRKKEPQ 
ATEKDISLTS 
EShhTSFKhD 
SEDSTSSGSE 
KSFSAGPVMS 
PVYNEASNSS 
FYLEDSTSPR 
VQSCTVDLGI 
YNRPKAYIAA 
NFLVTQKSVQ 
VLTFVRKAAY 
QRNYLVQTEE 
TLSPRLECRG 
NRTSSIIPVE 
DHNAQLWMI 
LEATQDDYVL 
TFCALTTLMH 
STSLDSNGAA 



Seq ID NO: 582 DNA sequence 

Nucleic Acid Accession #; NM_002851.1 

Coding sequence: 148.. 7092 



85 



1 

1 

CACACATACG 
CAAAAAAAAC 
CGGCGAGGGG 
CAGCTCCTCT 
CTTGTTGAAG 
AAATATCCAA 
CAAGTAAATG 
AACACATTCA 
GT CAGCGGAG 
AAATGCAATA 
GAGATGCAAA 
GGAAAAGGGA 
GATTTCAAAG 
TTAGATCCAT 
AATGG CTCAT 
ACAGTT AG CA 
TCTGGTTATG 
TTCT CTAGAC 
AGTT CAGAAC 
TGGGAAAGAC 
CAGTTGGATG 
GG TG C TAT TC 
TGCACTAATG 
AATCCTGAAC 
GAAGAGGGAA 
AACCAAATCA 
ACGAAATACA 
AAGGGTGATG 
ACAGAAAAAG 
GAAGGTACTT 
AACTTGTCGG 
AGTTTATTGA 
GCAACTTCTG 
GAAAACCCAG 
GAAGATTCAA 
GTGTGGTTTC 
AGCTTTCTCC 
TCCTTTTCTG 
CATTATTCTA 
TCCAGACAAC 
GTATACAATG 
ACCCCTTTGT 



11 
1 

CACGCACGAT 
ATTTCCTTCG 
CCGCAGACCG 
GTGTTTGCCG 
AGATTGGCTG 
CATGTAATAG 
TGAATCTTAA 
TTCATAACAC 
GAGTTTCAGA 
TGTCATCTGA 
TCTACTGCTT 
AGTTAAGAGC 
CGATTATTGA 
TCATACTGTT 
TGACATCTCC 
TCTCTGAAAG 
TCATGCTGAT 
AGGTGTTTTC 
CAGAAAATGT 
CTCGAGTCGT 
GAGAGGACCA 
TCAATAATTT 
GCTTATATGG 
TTGATCTTTT 
AAGACATTGA 
GGAAAAAGGA 
ATGAAGCCAA 
TTCCCAATAC 
ATATTTCCTT 
CAGCCTCTTT 
GGACTGCAGA 
CCAGTTTCAA 
CTATCCCATT 
AGACAATAAC 
CTTCATCAGG 
CTAGCT CTAC 
AGACTAATTA 
CAGGCCCAGT 
CCTTTGCCTA 
AGGATTTGGT 
GTGAGACACC 
TGCTTGACAA 



21 

I 

CTCACTTCGA 
CTCCCCCTCC 
TCTGGAAATG 
CCTGGATTGG 
GTCCTATACA 
CCCAAAACAA 
GAAACTTAAA 
TGGGAAAACA 
AATGGTGTTT 
TGGATCAGAG 
TGATGCGGAC 
TTTATCCATT 
TGGAGT CGAA 
GAACCTTCTG 
TCCCTGCACA 
CCAGTTGGCT 
GGACTACTTA 
CTCATACACT 
TCAGGCTGAC 
TTATGATACC 
AACCAAGCAT 
GCTACCCAAT 
AAAATACAGC 
CCCTGAATTA 
AGAAGGCGCT 
ACCCCAGATT 
GACTAACCGA 
ATCTTTAAAT 
GACTTCTCAG 
AAATGATGGC 
AT CCTTAAAT 
GCTTGATACT 
CATCTCTGAG 
ATATGATGTC 
TTCAGAAGAA 
AGACATAACA 
CACTGAGATA 
GATGTCACAG 
CTTCCCAACT 
CTCCACGGTC 
TCTTCAACCT 
TCAGATCCTC 



31 

I 

TCTATACACT 
CTCTCCACTC 
CGAATCCTAA 
GCTAATGGAT 
GGAGCACTGA 
TCTCCTATCA 
TTTCAGGGTT 
GTGGAAATTA 
AAAGCAAGCA 
CATAGTTTAG 
CGATTTTCAA 
TTGTTTGAGG 
AGTGTTAGTC 
CCAAACTCAA 
GACACAGTTG 
GTTTTTTGTG 
CAAAACAATT 
GGAAAGGAAG 
CCAGAGAATT 
ATGATTGAGA 
GAATTTTTGA 
ATGAGTTATG 
GACCAACTGA 
ATTGGAACTG 
ATTGTGAATC 
TCTACCACAA 
TCCCCAACAA 
TCCACTTCCC 
ACTGTGACTG 
TCTAAAACTG 
ACAGTTTCTA 
GGAGCTGAAG 
AACATAT CCC 
CTTATACCAG 
TCACTAAAGG 
GCACAGCCCG 
CGTGTTGATG 
GGTCCCTCAG 
GAGGTAACAC 
AACGTGGTAT 
TCCTACAGTA 
AACACTACCC 



t c t ti. a*r t c t a 


T HIT A A T Tf^T T 


5220 


AGTTTTCTGA 


CATTGTATTG 


5280 


AACTTTTGTG 


GAAAATAGAA 


5340 


TTACCAAACA 


TTGTTCAAAT 


5400 






J T o u 


41 


51 




i 

TGALNQKNWG 


1 

KKYPTCNSPK 


60 


TVEINLTNDY 


RVSGGVSEMV 


120 


DRFSSFEEAV 


KGKGKLRALS 


180 


LPNSTDKYYI 


YNGSLTSPPC 


240 


LQNNFREQQY 


KFSRQVFSSY 


300 


TMIEKFAVLY 


QQLDGEDQTK 


360 


SDQLIVDMPT 


DNPELDLFPE 


420 


ISTTTHYNRI 


GTKYNEAKTN 


480 


QTVTELPPHT 


VEGTSASLND 


540 


TGAEDSSGSS 


PATSAIPFIS 


600 


ESLKDPSMEG 


NVWFPSSTDI 


660 


QGPSVTDLEM 


PHYSTFAYFP 


720 


HESRIGLAEG 


LESEKKAVIP 


780 


VISTPPTPIF 


PISDDVGAIP 


840 


TADSSNHPDN 


KHKNRYINIV 


900 


QGPLKSTAED 


FWRMIWEHNV 


960 


VLAYYTVRNF 


TLRNTKIKKG 


1020 


AKRHAVGPW 


VHCSAGVGRT 


1080 


QYVFIHDTLV 


EAILSKETEV 


1140 


TISAHCNLPL 


PGIjTDPPTSA 


1200 


RSRVGISSLS 


GEGTDYINAS 


1260 


PDGQNMAEDE 


FVYWPNKDEP 


1320 


EVRHFQCPKW 


PNPDSPISKT 


1380 


QLEKENSVDV 


YQVAKMINLM 


1440 


LPDGNIAESL 


ESLV 




41 


51 




1 

GGAGGATTAA 


I 

AACAAACAAA 


60 


TGAGAAGCAG 


AGGAGCCGCA 


120 


AGCGTTTCCT 


CGCTTGCATT 


180 


ACTACAGACA 


ACAGAGAAAA 


240 


ATCAAAAAAA 


TTGGGGAAAG 


300 


ATATTGATGA 


AGATCTTACA 


360 


GGGATAAAAC 


AT C ATTGGAA 


420 


ATCTCACTAA 


TGACTACCGT 


480 


AGATAACTTT 


TCACTGGGGA 


540 


AAGGACAAAA 


ATTTCCACTT 


600 


GTTTTGAGGA 


AGCAGTCAAA 


660 


TTGGGACAGA 


AGAAAATTTG 


720 


GTTTTGGGAA 


GCAGGCTGCT 


780 


CTGACAAGTA 


TTACATTTAC 


840 


ACTGGATTGT 


TTTTAAAGAT 


900 


AAGTTCTTAC 


AATGCAACAA 


960 


TTCGAGAGCA 


ACAGTACAAG 


1020 


AGATT CATGA 


AGCAGTTTGT 


1080 


ATACCAGCCT 


TCTTGTTACA 


1140 


AGTTTGCAGT 


TTTGTACCAG 


1200 


CAGATGGCTA 


TCAAGACTTG 


1260 


TTCTTCAGAT 


AGTAGCCATA 


1320 


TTGTCGACAT 


GCCTACTGAT 


1380 


AAGAAATAAT 


CAAGGAGGAG 


1440 


CTGGTAGAGA 


CAGTGCTACA 


1500 


CACACTACAA 


TCGCATAGGG 


1560 


GAGGAAGTGA 


ATTCTCTGGA 


1620 


AACCAGTCAC 


TAAATTAGCC 


1680 


AACTGCCACC 


TCACACTGTG 


1740 


TTCTTAGATC 


TCCACATATG 


1800 


TAACAGAATA 


TGAGGAGGAG 


1860 


ATTCTTCAGG 


CTCCAGTCCC 


1920 


AAGGGTATAT 


ATTTTCCTCC 


1980 


AATCTGCTAG 


AAATGCTTCC 


2040 


ATCCTTCTAT 


GGAGGGAAAT 


2100 


ATGTTGGATC 


AGGCAGAGAG 


2160 


AATCTGAGAA 


GACAACCAAG 


2220 


TTACAGATCT 


GGAAATGCCA 


2280 


CTCATGCTTT 


TACCCCATCC 


2340 


ACTCGCAGAC 


AACCCAACCG 


2400 


GTGAAGTCTT 


TCCTCTAGTC 


2460 


CTGCTGCTTC 


AAGTAGTGAT 


2520 



410 
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TCGGCCTTGC ATGCTACGCC TGTATTTCCC 
TCTTCCTATG ATGGTGCACC TTTGCTTCCA 
TTTCGCCATC TGCATACAGT TTCTCAAATC 
GATAAGGTGC CCTTGCATGC TTCTCTGCCA 
5 AGCCTTGCTC AGTATT CTGA TGTGCTGTCC 

TTTGGTAGTG AATCTGGTGT TCTTTATAAA 
AGCAGTGATG CCATGATGCA TGCACGTTCT 
GATAATGAGG GCTCCCAACA CATCTTCACT 
GATTCTGTGG GTGTAACTTA TCAGGGTTCC 

10 CCTAAGTCTT CGTTAATAAC CCCAACTGCA 

GGTGATGGGG AATGGTCTGG AGCCTCTTCT 
GGGCTGACAG CCCTTAACAT TTCTTCACCT 
TCTGTGTTTG GTGATGATAA TAAGGCGCTT 
ACTGAACTGC AAATTCCTTC TTTCAATGAG 

15 CCCAACATGT ATGATAATGT AAATAAGTTG 

ATTTCTAGCA CCAAGGGCAT GTTTCCAGGG 
GATCATGAGA TTAGTCAAGT T C C AG AAAAT 
TCTCAAGCAT CTGGTGACAC TTCGCTTAAA 
TCCTCTGACC CTGCTTCTAG TGAAATGTTA 

20 ACCTCAGCTT CTTTTAGTAC TGAAGTATTG 

GACACCTTGC TTAAAACTGT TCTTCCAGCT 
CCCAAAGTTG ATAAAATTAG TTCTACAATG 
AGTGAAAACA TGCTGCACTC TACATCTGTA 
ATGCACTCTG CTTCACTTCA AGGTTTGACC 

25 GTTTTGTTAA AAAGTGAAAG TTCCCACCAA 

TTGTTCCAAA CGGCCAATTT GGAGATTAAC 
TTTGCTACAC CTGTTTT AT C AATTGATGAA 
CATTCCGATG AAATTTTAAC CTCCACCAAA 
ATT CCAACAG TTGCTTCTGA TACATTTGTA 

30 GGGCATGTTG CCATTACAGC TGTTTCTCCC 

TTGCTGTTTC CTTCTAAGGC AACTTCTGAG 
TTAGTGGGTG GTGGTGAAGA TGGTGACACT 
GATAGTGATG GCTTATCCAT TCATAAGTGT 
GAAAAGGTAA TGAATGATTC AGACACCCAC 

35 ATCTCATACT CACTAT CTG A GAATTCTGAA 

GACAGTCAAA CTGGTATGGA CAGAAGTCCT 
CAAAAGCACA ATGATGGAAA AGAGGAAAAT 
CTCAGCCCTG AATCTAAAGC ATGGGCAGTT 
CAAGGTACCT CAGATAGCCT TAATGAGAAT 

40 ACTAATGAAA AAGATGCTGA TGGGATCCTG 

TTCCCACAGT CCCCAACATC ATCTGTTACT 
GAGGCAGAGG CCAGTAATAG TAGCCATGAG 
TCCGAGAAGA AGGCAGTTAT ACCCCTTGTG 
GTGGTTCTTG TGGGTATTCT CATCTACTGG 

45 TTAGAGGACA GTACATCCCC TAGAGTTATA 

TCAGATGATG TCGGAGCAAT TCCAATAAAG 
GCAAGTAGTG GGTTTACTGA AGAATTTGAG 
AGCTGTACTG TTGACTTAGG TATTACAGCA 
AAGAATCGAT ACATAAATAT CGTTGCCTAT 

50 GCTGAAAAGG ATGGCAAACT GACTGATTAT 

AGACCAAAAG CTTATATTGC TGCCCAAGGC 
AGAATGATAT GGGAACATAA TGTGGAAGTT 
GGAAGGAGAA AATGTGATCA GTACTGGCCT 
CTGGTCACTC AGAAGAGTGT GCAAGTGCTT 

55 AGAAACACAA AAATAAAAAA GGGCTCCCAG 

CAGTATCACT ACACGCAGTG GCCTGACATG 
ACCTTTGTGA GAAAGGCAGC CTATGCCAAG 
TGCAGTGCTG GAGTTGGAAG AACAGGCACA 
ATT CAACACG AAGGAACTGT CAACATATTT 

60 AATTATTTGG TACAAACTGA GGAGCAATAT 

ATACTTAGTA AAGAAACTGA GGTGCTGGAC 
CTCATTCCTG GACCAGCAGG CAAAACAAAG 
TCAAATATAC AGCAGAGTGA CTATTCTGCA 
CGAACTTCTT CTATCATCCC TGTGGAAAGA 

65 GAAGGCACAG ACTACATCAA TGCCTCCTAT 

AT CATT ACCC AGCACCCTCT CCTTCATACC 
CATAATGCCC AACTGGTGGT TATGATTCCT 
GTTTACTGGC CAAATAAAGA TGAGCCTATA 
GCTGAAGAAC ACAAATGTCT AT CT AATGAG 

70 GAAGCTACAC AGGATGATTA TGTACTTGAA 

AATCCAGATA GCCCCATTAG TAAAACTTTT 
GCCAATAGGG ATGGGCCTAT GATTGTTCAT 
TTCTGTGCTC TGACAACCCT TATGCACCAA 
CAGGTAGCCA AGATGATCAA TCTGATGAGG 

75 CAGTTTCTCT ACAAAGTGAT CCTCAGCCTT 

ACCTCTCTGG ACAGTAATGG TGCAGCATTG 
TCTTTAGTTT AACACAGAAA GGGGTGGGGG 
CTAAAATTAG GCAGG AAAAT CAGTCTAGTT 
AGTAACTTTC ATGACATAGG ATTCTGCCGC 

80 TTTGCAAGAC TTGTAATTTA CTTATTATGT 

TTCTAAGAAT GGAATTGTGG TATTTTTTTC 
ATAGAGGTTA GGAATTCCAA ACTACAGAAA 
GTATTTGTAG CAATT AT CAG GTTTGCTAGA 
TAAAACACTC TTCCATATGA TATTCAACAT 

85 AATAAT CTGT TACTTATTGT AAATACTGCC 

ATAATTGTAG ATTTTTATAT TTTACTACTG 
TAGTTTAATG ACGTAGTTCA TTAGCTGGTC 



AGTGTCGATG TGTCATTTGA ATCCATCCTG 2580 

TTTTCCTCTG CTTCCTTCAG TAGTGAATTG 2640 

CTTCCACAAG TTACTTCAGC TACCGAGAGT 2700 

GTGGCTGGGG GTGATTTGCT ATTAGAGCCC 2760 

ACTACTCATG CTGCTTCAGA GACGCTGGAA 2820 

ACGCTTATGT TTTCTCAAGT TGAACCACCC 2 880 

TCAGGGCCTG AACCTTCTTA TGCCTTGTCT 2940 

GTTTCTTACA GTTCTGCAAT ACCTGTGCAT 3 000 

TTATTTAGCG GCCCTAGCCA TATACCAATA 30 60 

TCATTACTGC AGCCTACTCA TGCCCTCTCT 3120 

GATAGTGAAT TTCTTTTACC TGACACAGAT 3180 

GTTTCTGTAG CTGAATTTAC ATATACAACA 3240 

TCTAAAAGTG AAATAATATA TGGAAATGAG 3300 

ATGGTTTACC CTTCTGAAAG CACAGTCATG 33 60 

AATGCGTCTT TACAAGAAAC CTCTGTTTCC 3420 

TCCCTTGCTC ATACCACCAC TAAGGTTTTT 3480 

AACTTTTCAG TTCAACCTAC ACATACTGTC 3540 

CCTGTGCTTA GTGCAAACTC AGAGCCAGCA 3 60 0 

TCTCCTTCAA CTCAGCTCTT ATTTTATGAG 3 660 

CTACAACCTT CCTTTCAGGC TTCTGATGTT 372 0 

GTGCCCAGTG AT CCAAT AT T GGTTGAAACC 3780 

TTGCATCTCA TTGTAT CAAA TTCTGCTTCA 3 840 

CCAGTTTTTG ATGTGTCGCC TACTTCTCAT 3 900 

ATTTCCTATG CAAGTGAGAA ATATGAACCA 3 960 

GTGGTACCTT CTTTGTACAG TAATGATGAG 4 02 0 

CAGGCCCATC CCCCAAAAGG AAGG CATGT A 4080 

CCATTAAATA CACTAATAAA TAAGCTTATA 4140 

AGTTCTGTTA CTGGTAAGGT ATTTGCTGGT 4200 

TCTACTGATC ATTCTGTTCC TATAGGAAAT 4260 

CACAGAGATG GTTCTGTAAC CT CAACAAAG 4320 

CTGAGT CAT A GTGCCAAATC TGATGCCGGT 4380 

GATGATGATG GTGATGATGA TGATGACAGA 4440 

ATGTCATGCT CATCCTATAG AGAATCACAG 4500 

GAAAACAGTC TTATGGATCA G AATAAT CCA 4560 

GAAGATAATA GAGTCACAAG TGTATCCTCA 4620 

GGTAAATCAC CATCAG CAAA TGGGCTATCC 4680 

GACATTCAGA CTGGTAGTGC TCTGCTTCCT 4740 

CTGACAAGTG ATGAAGAAAG TGGATCAGGG 480 0 

GAGACTTCCA CAGATTTCAG TTTTGCAGAC 4860 

GCAGCAGGTG ACTCAGAAAT AACTCCTGGA 4920 

AGCGAGAACT CAGAAGTGTT CCACGTTTCA 4980 

TCTCGTATTG GTCTAGCTGA GGGGTTGGAA 5040 

ATCGTGTCAG CCCTGACTTT TATCTGTCTA 5100 

AGGAAATGCT TCCAGACTGC ACACTTTTAC 5160 

TCCACACCTC CAACACCTAT CTTTCCAATT 5220 

CACTTTCCAA AGCATGTTGC AGATTTACAT 5280 

ACACTGAAAG AGTTTTACCA GGAAGTGCAG 5340 

GACAGCT CCA ACCACCCAGA CAACAAGCAC 5400 

GATCATAGCA GGGTTAAGCT AGCACAGCTT 5460 

ATCAATGCCA ATTATGTTGA TGGCTACAAC 5520 

CCACTGAAAT CCACAGCTGA AGATTTCTGG 5580 

ATTGTCATGA TAACAAACCT CGTGGAGAAA 5 640 

GCCGATGGGA GTGAGGAGTA CGGGAACTTT 5700 

GCCTATTATA CTGTGAGGAA TTTTACTCTA 5760 

AAAGGAAGAC CCAGTGGACG TGTGGT CACA 582 0 

GGAGTACCAG AGTACTCCCT GCCAGTGCTG 5880 

CGCCATGCAG TGGGGCCTGT TGTCGTCCAC 5 940 

TATATTGTGC TAGACAGTAT GTTGCAGCAG 60 00 

GGCTTCTTAA AACACATCCG TTCACAAAGA 6060 

GTCTTCATTC ATGATACACT GGTTGAGGCC 6120 

AGT CATATTC ATGCCTATGT TAATGCACTC 6180 

CTAGAGAAAC AATTCCAGCT CC TG AG C CAG 6240 

GCCCTAAAGC AATGCAACAG GGAAAAGAAT 6300 

TCAAGGGTTG GCATTTCATC CCTGAGTGGA 6360 

ATCATGGGCT ATTACCAGAG CAATGAATTC 6420 

ATCAAGGATT TCTGGAGGAT GATATGGGAC 6480 

GATGGCCAAA ACATGGCAGA AGATGAATTT 6540 

AATTGTGAGA GCTTTAAGGT CACTCTTATG 6600 

GAAAAACTTA TAATTCAGGA CTTTATCTTA 6660 

GTGAGGCACT TTCAGTGTCC TAAATGGCCA 672 0 

GAACTTATAA GTGTTATAAA AGAAGAAGCT 6780 

GATGAGCATG GAGGAGTGAC GGCAGGAACT 6840 

CTAGAAAAAG AAAATTCCGT GGATGTTTAC 6900 

CCAGGAGTCT TTGCTGACAT TGAGCAGTAT 6960 

GTGAGCACAA GGCAGGAAGA GAATCCATCC 7020 

CCTGATGGAA ATATAGCTGA GAGCTTAGAG 7080 

GACTCACATC TGAGCATTGT TTTCCTCTTC 7140 

CTGTTATCTG TTGATTTCCC AT CACCTGAC 7200 

CAAATT TAT A TCATTAACAA TGTGTGCCTT 72 60 

TTGAACTAAA ATGATTGAAT TTTACAGTAT 7320 

TGTATTGATT TTAACAGAAA ATTTCAATTT 7380 

ATGTTTGTTT TTAGTGTCAA ATTTTTAGCT 7440 

AATATAACTT TTAATACAGT AGCCTGTAAA 750 0 

TTTACAACTG CAGTATTCAC CTAAAGTAGA 7560 

CTAGTGTCTC CATGGACCAA ATTTATATTT 7620 

AGT CAAGTTT TCTAGTTCTG TGTAATTGTT 7680 

TTACTCTACC AGTTTTCTGA CATTGTATTG 7740 
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TGTTACCTAA GTCATTAACT TTGTTTCAGC ATGTAATTTT AACTTTTGTG GAAAATAGAA 78 0 0 
ATACCTTCAT TTTGAAAGAA GTTTTTATGA GAATAACACC TTACCAAACA TTGTTCAAAT 7860 
GGTTTTTATC CAAGGAATTG CAAAAATAAA TATAAATATT GCCATTAAAA AAAAAAAAAA 792 0 
AAAAAAAAAA AAAAAAAAAA A 
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Seq ID NO: 583 Protein sequence 
Protein Accession #: NP__002842.1 
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MRILKRFLAC 
QSPINIDEDL 
PKAS KIT FHW 
II/FEVGTEEN 
TDTVDW I VFK 
TGKEEIHEAV 
HEFLTDGYQD 
LIGTEEIIKE 
RSPTRGSEFS 
GSKTVLRSPH 
ENISQGYIFS 
TAQPDVGSGR 
TEVTPHAFTP 
LNTTPAASSS 
ILPQVTSATE 
KTLMFSQVEP 
SLFSGPSHIP 
PVSVAEFTYT 
LNASLQETSV 
KPVLSANSEP 
AVPSDPILVE 
TISYASEKYE 
EPLNTL INKL 
PHRDGSVTST 
CMSCSSYRES 
PGKSPSANGL 
NETSTDFSFA 
ESRIGLAEGL 
ISTPPTPIFP 
ADSSNHPDNK 
GPLKSTAEDF 
LAYYTVRNFT 
KRHAVGPVW 
YVF IHDTLVE 
AALKQCNREK 
TIKDFWRMIW 
EEICLIIQDFI 
HDEHGGVTAG 
LVSTRQEENP 



11 
I 

IQLLCVCRLD 
TQVNVNLKKL 
GKCNMSSDGS 
LDFKAIIDGV 
DTVSISESQL 
CSSEPENVQA 
LGAILNNLLP 
EEEGKDIEEG 
GKGDVPNTSL 
MNLSGTAESL 
SENPETITYD 
ESFLQTNYTE 
SSRQQDLVST 
DSALHATPVF 
SDKVPLHASL 
PSSDAMMHAR 
IPKSSLITPT 
TSVFGDDNKA 
SISSTKGMFP 
ASSDPASSEM 
TPKVDKISST 
PVLLKSESSH 
IHSDEILTST 
KLLFPSKATS 
QEKVMNDSDT 
SQKHNDGKEE 
DTNEKDADGI 
ESEKKAVI PL 
ISDDVGAIPI 
HKNRYINIVA 
WRMIWEHNVE 
LRNTK I KKGS 
HCSAGVGRTG 
AILSKETEVL 
NRTSSIIPVE 
DHNAQLVVMI 
liEATQDDYVL 
TFCALTTLMH 
STSLDSNGAA 



21 

I 

WANGYYRQQR 
KFQGWDKTSL 
EHSLEGQKFP 
ESVSRFGKQA 
AVFCEVLTMQ 
DPENYTSLLV 
NMSYVLQIVA 
AIVNPGRDSA 
NSTSQPVTKL 
NTVSITEYEE 
VLIPESARNA 
IRVDESEKTT 
VNWYSQTTQ 
PSVDVSFESI 
PVAGGDLLLE 
SSGPEPSYAL 
ASLLQPTHAL 
LSKSEIIYGN 
GSLAHTTTKV 
LSPSTQLLFY 
MLHLIVSNSA 
QWPSLYSND 
KSSVTGKVFA 
ELSHSAKSDA 
HENSLMDQNN 
NDIQTGSALL 
LAAGDSEITP 
VIVSALTFIC 
KHFPKHVADL 
YDHSRVKLAQ 
VIVMITNLVE 
QKGRPSGRW 
TYIVLDSMLQ 
DSH I HAYVNA 
RSRVGISSLS 
PDGQNMAEDE 
EVRHFQCPKW 
QLEKENSVDV 
LPDGNIAESL 



31 



KLVEEIGWSY 
ENTF IHNTGK 
LEMQIYCFDA 
ALDPFILLNL 
QSGYVMLMDY 
TWERPRWYD 
ICTNGLYGKY 
TNQIRKKEPQ 
ATEKDISLTS 
ESLLTSFKLD 
SEDSTSSGSE 
KSFSAGPVMS 
PVYNGETPLQ 
LSSYDGAPLL 
PSLAQYSDVL 
SDNEGSQHIF 
SGDGEWSGAS 
ETELQIPSFN 
FDHEISQVPE 
ETSASFSTEV 
SSENMLHSTS 
ELFQTANLEI 
GIPTVASDTF 
GLVGGGEDGD 
PISYSLSENS 
PLSPESKAWA 
GFPQSPTSSV 
LWLVGILIY 
HASSGFTEEF 
LAEKDGKLTD 
KGRRKCDQYW 
TQYHYTQWPD 
QIQHEGTVNI 
LLIPGPAGKT 
GEGTDYINAS 
FVYWPNKDEP 
PNPDSPISKT 
YQVAKMINLM 
ESLV 



41 

TGALNQKNWG 
TVEINLTNDY 
DRFSSFEEAV 
LPNSTDKYYI 
LQNNFREQQY 
TMIEKFAVIiY 
SDQLIVDMPT 
ISTTTHYNRI 
QTVTELPPHT 
TGAEDSSGSS 
ESJjKDPSMEG 
QGPSVTDLEM 
PSYSSEVFPL 
PFSSASFSSE 
STTHAASETL 
TVSYSSAIPV 
SDSEFLLPDT 
EMVYPSESTV 
NNFSVQPTHT 
LLQPSFQASD 
VPVFDVSPTS 
NQAHPPKGRH 
VSTDHSVPIG 
TDDDGDDDDD 
EEDNRVTSVS 
VLTSDEESGS 
TSENSEVFHV 
WRKCFQTAHF 
ETLKEFYQEV 
YINANYVDGY 
PADGSEEYGN 
MGVPEYSLPV 
FGFLKHIRSQ 
KLEKQFQLLS 
YIMGYYQSNE 
INCESFKVTL 
FELISVIKEE 
RPGVFADIEQ 



51 

I 

KKYPTCNSPK 
RVSGGVSEMV 
KGKGKLRALS 
YNGSLTSPPC 
KFSRQVFSSY 
QQLDGEDQTK 
DNPELDLFPE 
GTKYNEAKTN 
VEGTSASLND 
PATSAIPFIS 
NVWFPSSTDI 
PHYSTFAYFP 
VTPLLLDNQI 
LFRHIjHTVSQ 
EFGSESGVLY 
HDSVGVTYQG 
DGLTALNISS 
MPNMYDNVNK 
VSQASGDTSL 
VDTLLKTVLP 
HMHSASLQGL 
VFATPVLSID 
NGHVA I TAVS 
RDSDGLSIHK 
SDSQTGMDRS 
GQGTSDSLNE 
SEAEASNSSH 
YLEDSTSPRV 
QSCTVDLGIT 
NRPKAYIAAQ 
FLVTQKSVQV 
LTFVRKAAYA 
RNYLVQTEEQ 
QSNIQQSDYS 
FIITQHPLLH 
MAEEHKCLSN 
AANRDGPMIV 
YQFLYKVILS 



Seq ID NO: 584 DNA sequence 

Nucleic Acid Accession ft: NM_005688.1 

Coding sequence: 12 6.. 443 9 



85 



CCGGGCAGGT 
AGGGGCGCAG 
AGAAGATGAA 
GTGTGAGGGA 
GGAGAACTCG 
TCTCTCTTGA 
GAAAGTACCA 
ACCCAGTGGA 
CCCGTGTGGC 
ACGAGTCTTC 
AAGTTGGGCC 
TCATCCTGTC 
TCATGGTGAA 
TGTTGTTAGT 
CTTGGGCATT 
TTAAGAAGAT 
TTTGCTCCAA 
GAGGACCCGT 
GCTTCCTGGG 
T C ACAGCAT A 
ATGAAGTTCT 
AGAGTGTTCA 
AGGGTATCAC 
CTGTTCATAT 
TCTTCAATTC 
AAGCCT CAGT 
TAAAGAACAA 
GGGACTCCTC 
ACAAGAGGGC 
AGGCGGTGCT 
CCGAAGAGGA 



11 
i 

GGCTCATGCT 
GAATTCTGAT 
GGATAT CGAC 
GAGAACCAGC 
ACCGT TGGAA 
TGCCTCCATG 
TCATGGCTTG 
CAATG CTGGG 
CCACAAGAAG 
TGACGTGAAC 
AGACGCTGCT 
CATCGTGTGC 
ACACCTCTTG 
GCTGGGCCTC 
GAATTACCGA 
CCTTAAGTTA 
CGATGGGCAG 
TGTTGCCATC 
ATCAGCTGTT 
TTTCAGGAGA 
TACTTACATT 
AAAAATCCGC 
TGTGGGTGTG 
GACCCTGGGC 
CATGACTTTT 
GGCTGTTGAC 
ACCAGCCAGT 
CCACTCCAGT 
TTCCAGGGGC 
GGCAGAGCAG 
AGAAGGCAAG 



21 
I 

CGGGAGCGTG 
GTGAAACTAA 
ATAGGAAAAG 
ACTTCTGGGA 
TGCCAAGATG 
CATTCTCAGC 
AGTGCTCTGA 
CTTTTTTCCT 
GGGGAGCTCT 
TGCAGAAGAC 
TCCCTGCGAA 
CTGATGATCA 
GAGTATACCC 
CTCCTGACGG 
ACCGGTGTCC 
AAGAACATTA 
AGAATGTTTG 
TTAGGCATGA 
TTTATCCTCT 
AAATGCGTGG 
AAATTTATCA 
GAGGAGGAGC 
GCTCCCATTG 
TTCGATCTGA 
GCTTTGAAAG 
AGATTTAAGA 
CCTCACATCA 
ATCCAGAACT 
AAGAAAGAGA 
AAAGGCCACC 
CACATCCACC 



31 



GTTGAGCGGC 
CAGTCTGTGA 
AGTATATCAT 
CGCACAGAGA 
CCTTGGAAAC 
TCAGAATCCT 
AGCCCATCCG 
GTATGACTTT 
CAATGGAAGA 
TAGAGAGACT 
GGGTTGTGTG 
CGCAGCTGGC 
AGGCAACAGA 
AAATCGTGCG 
GCTTGCGGGG 
AAGAGAAATC 
AGGCAGCAGC 
TTTATAATGT 
TTTACCCAGC 
CCGCCACGGA 
AAATGTATGC 
GTCGGATATT 
TGGTGGTGAT 
CAGCAGCACA 
TAACACCGTT 
GTTTGTTTCT 
AGATAGAGAT 
CGCCCAAGCT 
AGGTGAGGCA 
TCCTCCTGGA 
TGGGCCACCT 



41 
I 

TGGCGCGGTT 
GCCCTGGAAC 
CCCCAGTCCT 
CCGTGAAGAT 
AGCAGCCCGA 
GGATGAGGAG 
GACTACTTCC 
TTCGTGGCTT 
CGTGTGGTCT 
GTGGCAAGAA 
GATCTTCTGC 
TGGCTTCAGT 
GTCTAACCTG 
GTCTTGGTCG 
GGCCATCCTA 
CCTGGGTGAG 
CGTTGGCAGC 
AATTATTCTG 
AATGATGTTT 
TGAACGTGTC 
CTGGGTCAAA 
GGAAAAAGCC 
TGCCAGCGTG 
GGCTTTCACA 
TTCAGTAAAG 
AATGGAAGAG 
GAAAAATGCC 
GACCCCCAAA 
GCTGCAGCGC 
CAGTGACGAG 
GCGCTTACAG 



51 
I 

GTCCTGGAGC 
CTCCGCTCAG 
GGGTATAGAA 
TCCAAGTTCA 
GCCGAGGGCC 
CATCCCAAGG 
AAACACCAGC 
TCTTCTCTGG 
CTGTCCAAGC 
GAGCTGAATG 
CGCACCAGGC 
GGACCAGCCT 
CAGT AC AG CT 
CTTGCACTGA 
ACCATGGCAT 
CT CAT CAACA 
CTGCTGGCTG 
GGACCAACAG 
GCATCACGGC 
CAGAAGATGA 
GCATTTTCTC 
GGGTACTTCC 
GTGACCTTCT 
GTGGTGACAG 
TCCCTCTCAG 
GTTCACATGA 
ACCTTGGCAT 
ATGAAAAAAG 
ACTGAGCATC 
CGGCCCAGTC 
AGGACACTGC 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
72 0 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 



412 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



WO 02/086443 

ACAGCAT CGA TCTGGAGATC 
GTGGAAAAAC CTCTCTCATT 
TTG CAATCAG TGGAACCTTG 
TGAGAGACAA CATCCTGTTT 
ACAGCTGCTG CCTGAGGCCT 
GAG AG CG AGG AGCCAACCTG 
TGTATAGTGA CAGGAGCATC 
TGGGCAACCA CATCTT CAAT 
TTGTTACCCA CCAGTTACAG 
GCTGTATTAC GGAAAGAGGC 
CCATTTTTAA TAACCTGTTG 
AAACCAGTGG TTCACAGAAG 
AGGAAAAAGC AGTAAAGCCA 
GTTCAGTGCC CTGGTCAGTA 
TCCTGGTTAT TATGGCCCTT 
GGTTGAGTTA CTGGATCAAG 
CCTCGGTGAG TGACAGCATG 
CCCTCTCCAT GGCAGTCATG 
GCACGCTGCG AGCTTCCTCC 
CTATGAAGTT TTTTGACACG 
TGGATGAAGT TGACGTGCGG 
TGGTGTTCTT CTGTGTGGGA 
GGCCCCTTGT CATCCTCTTT 
TGAAGCGTCT GGACAATATC 
AGGGCCTTGC CACCATCCAC 
AGCTGCTGGA TGACAACCAA 
CTGTGCGGCT GGACCTCATC 
TTATGCACGG GCAGATTCCC 
TAACGGGGCT GTTCCAGTTT 
CGGTGGAGAG GATCAATCAC 
AGAACAAGGC TCCCTCCCCT 
AGATG AGG T A CCGAGAAAAC 
CTAAAGAGAA GATTGGCATT 
CCCTCTTCCG TCTGGTGGAG 
GTGATATTGG CCTTGCCGAC 
TGTTCAGTGG CACTGTCAGA 
TTTGGGATGC CCTGGAGAGG 
TTGAATCTGA AGTGATGGAG 
GCATAGCTAG AGCCCTGCTC 
CCATGGACAC AGAGACAGAC 
GTACCATGCT GACCATTGCC 
TGCTGGCCCA GGGACAGGTG 
GTTCCCGATT CTATGCCATG 
TCCTCCCTGT TGACGAAGTC 
CCCCTCATCG CGTCCTCCTA 
GTTCCGGATT GGCTTGTGTG 
ATTCCATATT CATGTAAACA 
GGGAACCGTT ATTATAATTG 
T CT AT AT AT A ATTCTGTACA 
TAT TAAAATA AGCACTGTGC 
TTGCTGTACT AGAGATCTGG 
CTCTAGCTGG TGGTTTCACG 
ATAGTGGGCG CTCCGACAGC 
GAGACGGGTG GGCGGCTGGA 
CTGTCCTGGT GT CACTT ACT 
TTTCACTCCC TCCATCAAGA 
TTTCCTGCCT TCTTCTTTTT 
TCCCAGTGCC TCAGGTTCCT 
GTTGGTTCCA AGCCCTGGAG 
ATTCCCACAC CTCCACAGTT 
CTCACCGCAG TCGTCGCACA 
CAGCTCTTGC TAATCAGTGT 
ACCTCAGGTT GCTGGTTGCT 
GGGGCTGGTA GCTCAGGTGG 
ATGTCGTGAC CAACTAGACA 
CAAAAATCTG AAAATGTGAA 
AAAAAAAAAA AAAAAAAA 



PCT/US02/12476 



CAAGAGGGTA 
TCAGCCATTT 
GCTTATGTGG 
GGGAAGGAAT 
GACCTGGCCA 
AGCGGTGGGC 
TACATCCTGG 
AGTGCTATCC 
TACCTGGTTG 
ACCCATGAGG 
CTGGGAGAGA 
AAGTCACAAG 
GAGGAAGGGC 
T ATGGTGT CT 
TTCATGCTGA 
CAAGGAAGCG 
AAGGACAATC 
CTGATCCTGA 
CGGCTGCATG 
ACCCCCACAG 
CTGCCGTTCC 
ATGATCGCAG 
TCAGTCCTGC 
ACGCAGTCAC 
GCCTACAATA 
GCTCCTTTTT 
AGCATCGCCC 
CCAGCCTATG 
ACGGTCAGAC 
TACATTAAGA 
GACTGGCCCC 
CTCCCTCTTG 
GTGGGGCGGA 
TT AT CTGGAG 
CT CCGAAGCA 
TCAAATTTGG 
ACACACATGA 
AATGGGGATA 
CGCCACTGTA 
TTATTGATTC 
CATCGCCTGC 
GTGGAGTTTG 
TTTGCTGCTG 
TCTTTTCTTT 
CCGAAACCTT 
TTTCACTTTT 
AAATTTAGTT 
TATCAGAGGC 
TAGCCTATAT 
TAATAACAGT 
TTTTGCTATT 
GTGCCAGGTT 
CCCCTCTGCC 
GACCATGCAG 
GTTTCTGTCA 
ATGGGGATCA 
GCTGTTGTTT 
ATGGCTGGCC 
CCAACTGCTG 
CAGTGGCAGG 
GTCTCTCTCT 
CTCACACTGG 
GTGTGGTTTG 
GCGTGGTCAC 
TTCTGTCGCC 
TAAAATTATT 



AACTGGTTGG 
TAGGCCAGAT 
CCCAGCAGGC 
ATGATGAAGA 
TTCTTCCCAG 
AGCGCCAGAG 
ACGACCCCCT 
GGAAACATCT 
ACTGTGATGA 
AACTGATGAA 
CACCGCCAGT 
ACAAGGGTCC 
AGCTTGTGCA 
ACATCCAGGC 
ATGTAGGCAG 
GGAACACCAC 
CTCATATGCA 
AAGCCATTCG 
ACGAGCTTTT 
GGAGGATTCT 
AGGCCGAGAT 
GAGTCTTCCC 
ACATTGTCTC 
CTTTCCTCTC 
AAGGGCAGGA 
TTTTGTTTAC 
TCATCACCAC 
CGGGTCTCGC 
TGGCATCTGA 
CTCTGTCCTT 
AGGAGGGAGA 
TCCTAAAGAA 
CAGGATCAGG 
GCTGCATCAA 
AACTCTCTAT 
ACCCCTTCAA 
AAGAATGTAT 
ACTTCTCAGT 
AGATTCTGAT 
AAGAGACCAT 
ACACGGTTCT 
ACACCCCATC 
CAGAGAACAA 
AGAGCATTGC 
GCCTTTCTCG 
AGGGAGAGTC 
TTTGTTCTTA 
CTATAATGAA 
TTACAGTGAA 
GCATATTCCT 
AGACTGTAGG 
TTCTGGGTGT 
GCCTCCCCAC 
AGCGCCGTGA 
GGAGAGCAGC 
CAGAGACATT 
CTAAACAAGA 
ACTGCACAGA 
CTTTTTGAGG 
GCTCAGGATT 
CTCTCTCCCC 
CGTAGAAGTT 
GTGTGTTCCC 
TGCTGTCATC 
TTAGCATGTT 
TTGGATTTTG 



AATCTGCGGC 
GACGCTTCTA 
CTGGATCCTC 
AAGATACAAC 
CAGCGACCTG 
GATCAGCCTT 
CAGTGCCTTA 
CAAGTCCAAG 
AGTGATCTTC 
TTTAAATGGT 
TGAGATCAAT 
TAAAACAGGA 
GCTGGAAGAG 
TGCTGGGGGC 
CACCGCCTTC 
TGTGACTCGA 
GTACTATGCC 
AGGAGTTGTC 
CCGAAGGATC 
CAACAGGTTT 
GTTCATCCAG 
GTGGTTCCTT 
CAGGGTCCTG 
CCACATCACG 
GTTTCTGCAC 
GTGTGCGATG 
CACGGGGCTG 
CATCTCTTAT 
GACAGAAGCT 
GGAAGCACCT 
GGTGACCTTT 
AGT AT CCTTC 
GAAGT CCTCG 
GATTGATGGA 
CATTCCTCAA 
CCAGTACACT 
TGCTCAGCTA 
GGGGGAACGG 
TTTAGATGAA 
CCGAGAAGCA 
AGGCTCCGAT 
GGT CCTTCTG 
GGTCGCTGTC 
CATTCCCTGC 
ATTTTATCTT 
ATATTTTGAT 
ATTGCACTCT 
GCTTTATACG 
AATGTAAGCT 
TTCTATCATT 
AAGAGTAGCA 
CCAAAGGAAG 
AGCCGCTCCA 
GTTCTCAGGG 
GGGGCGAAGC 
CCTCCGAGCC 
ATCAGTCTAT 
GCTCTCCAGC 
TGGCACTTTT 
TCGTGGGTCT 
TCAAAGTCTG 
TTTGTACTGT 
GCAAACCCCC 
AGTTGAATGG 
TGCTGAACAC 
TAAAAAAAAA 



AGTGTGGGAA 192 0 

GAGGGCAGCA 1980 

AATGCTACTC 2 040 

TCTGTGCTGA 2100 

ACGGAGATTG 2160 

GCCCGGGCCT 2220 

GATGCCCATG 2280 

ACAGTTCTGT 2340 

ATGAAAGAGG 2400 

GACTATGCTA 2460 

TCAAAAAAGG 252 0 

TCAGTAAAGA 25 80 

AAAGGGCAGG 2640 

CCCTTGGCAT 270 0 

AGCACCTGGT 2 760 

GGGAACGAGA 2 82 0 

AGCATCTACG 2880 

TTTGTCAAGG 2940 

CTT CGAAGCC 3000 

T CCAAAGAC A 3060 

AACGTTATCC 312 0 

GTGGCAGTGG 3180 

ATTCGGGAGC 3240 

TCCAGCATAC 3 3 0 0 

AGATACCAGG 3 3 60 

CGGTGGCTGG 3420 

ATGATCGTTC 3480 

GCTGTCCAGT 3540 

CGATTCACCT 360 0 

GCCAGAATTA 3660 

GAGAACGCAG 3720 

ACGATCAAAC 3780 

CTGGGGATGG 3840 

GTGAGAATCA 3 900 

GAGCCGGTGC 3960 

GAAGACCAGA 4020 

CCTCTGAAAC 40 80 

CAGCTCTTGT 4140 

GCCACAGCTG 4200 

TTTGCAGACT 42 60 

AGGATTATGG 432 0 

TCCAACGACA 43 80 

AAGGGCTGAC 4440 

CTGGGGCGGG 4500 

TCGCACAGCA 4560 

TATTGTATTT 462 0 

AAAAGGTTCA 4680 

TGTAGCTATA 4740 

GTTTATTTTA 4800 

TTTGTACAGT 4 860 

TTTCATTCTT 4 920 

ACGTGTGGCA 4980 

GGGGTGGCTG 5040 

CTCCTGCCTT 5100 

CCAGGCCCCT 5160 

GGGGAGTTTC 5220 

CCACAGAGAG 52 8 0 

TCCAAGACCT 5340 

TCATTTGCCT 5400 

GTTTTCCTTT 54 60 

CAACTTTAAG 5520 

AAAGAGACCT 5580 

TTTGTGCTGT 5640 

TCAGCGTTGC 5700 

CTTGTGGAAG 5760 

AAAAAAAAAA 5820 



Seq ID NO: 585 Protein sequence 
70 Protein Accession #: NP 005679.1 



75 



80 



85 



MKDXDIGKEY 
LDASMHSQLR 
VAHKKGELSM 
LSIVCLMITQ 
ALNYRTGVRL 
PWAILGMIY 
VLTYIKFIKM 
HMTLGFDLTA 
NKPASPHIKI 
VLAEQKGHLL 
KTSLISAILG 
CCLRPDLAIL 
NHIFNSAIRK 
FNNLLLGETP 



11 
! 

IIPSPGYRSV 
ILDEEHPKGK 
EDVWSLSKHE 
LAGFSGPAFM 
RG A I LTMAF K 
NVI ILGPTGF 
YAWVKAFSQS 
AQAFTWTVF 
EMKNATLAWD 
LDSDERPSPE 
QMTLLEGSIA 
PSSDLTEIGE 
HLKSKTVLFV 
PVEINSKKET 



21 
I 

RERTSTSGTH 
YHHGL S ALiKP 
SSDVNCRRLE 
VKHLLEYTQA 
KILKLKNIKE 
LGSAVFILFY 
VQKIREEERR 
NSMTFALKVT 
SSHSSIQNSP 
EEEGKHIHLG 
ISGTFAYVAQ 
RGANLSGGQR 
THQLQYLVDC 
SGSQKKSQDK 



31 
I 

RDREDSKFRR 
IRTTSKHQHP 
RLWQEELNEV 
TESNLQYSLL 
KSLGELINIC 
PAMMFASRLT 
ILEKAGYFQG 
PFSVKSLSEA 
KLTPKMKKDK 
HLRLQRTLHS 
QAWILNATLR 
QRISLARALY 
DEVIFMKEGC 
GPKTGSVKKE 



41 
I 

TRPLECQDAL 
VDNAGLFS CM 
GPDAASLRRV 
LVLGLLLTEI 
SNDGQRMFEA 
AYFRRKCVAA 
ITVGVAPIW 
SVAVDRFKSL 
RASRGKKEKV 
IDLEIQEGKL 
DNILFGKEYD 
SDRSIYILDD 
ITERGTHEEL 
KAVKPEEGQL 



51 
I 

ETAARAEGLS 60 

TFSWLSSLAR 120 

VWIFCRTRLI 180 

VRSWSLALTW 240 

AAVGSLLAGG 300 

TDERVQKMNE 3 60 

VIASWTFSV 420 

FLMEEVHMIK 480 

RQLQRTEHQA 540 

VGICGSVGSG 600 

EERYNSVLNS 660 

PLSALDAHVG 72 0 

MNLNGDYATI 780 

VQLEEKGQGS 840 



1 



413 



WO 02/086443 PCT/US02/12476 

VPWSVYGVYI QAAGGPLAFL VIMALFMLNV GSTAFSTWWL SYWIKQGSGN TTVTRGNETS 900 
VSDSMKDNPH MQYYAS I YAL SMAVMLILKA IRGWFVKGT LRASSRLHDE LFRRILRSPM 960 

KFFDTTPTGR ILNRFSKDMD EVDVRLPFQA EMFIQNVILV FFCVGMIAGV FPWFLVAVGP 1020 

LVILFSVLHI VSRVLIRELK RLDNITQSPF LSHXTSSIQG LATIHAYNKG QEFLHRYQEL 1080 

5 LDDNQAPFFL FTCAMRWLAV RLDLISIALI TTTGLMIVLM HGQIPPAYAG LAISYAVQLT 1140 

GLFQFTVRLA SETEARFTSV ERINHYIKTL SLEAPARIKN KAPSPDWPQE GEVTFENAEM 12 00 

RYRENLPLVL KKVSFTIKPK EKIGIVGRTG SGKSSLGMAL FRXiVELSGGC IKIDGVRISD 1260 

IGLADLRSKL SIIPQEPVLF SGTVRSNLDP FNQYTEDQIW DALERTHMKE CIAQLPLKLE 1320 

SEVMENGDNF SVGERQLLCI ARALLRHCKI LILDEATAAM DTETDLLIQE TIREAFADCT 13 80 
10 MLTIAHRLHT VLGSDRIMVL AQGQWEFDT PSVLLSNDSS RFYAMFAAAE NKVAVKG 



15 



40 



Seq ID NO: 586 DNA sequence 

Nucleic Acid Accession #: NM_001327.1 

Coding sequence: 89.. 631 



11 21 31 41 51 

1 I I I I 

AGCAGGGGGC GCTGTGTGTA CCGAGAATAC GAGAATACCT CGTGGGCCCT GACCTTCTCT 60 

CTGAGAGCCG GGCAGAGGCT CCGGAGCCAT GCAGGCCGAA GGCCGGGGCA CAGGGGGTTC 120 

20 GACGGGCGAT GCTGATGGCC CAGGAGGCCC TGGCATTCCT GATGGCCCAG GGGGCAATGC 180 

TGGCGGCCCA GGAGAGGCGG GTGCCACGGG CGGCAGAGGT CCCCGGGGCG CAGGGGCAGC 240 

AAGGGCCTCG GGGCCGGGAG GAGGCGCCCC GCGGGGTCCG CATGGCGGCG CGGCTTCAGG 3 00 

GCTGAATGGA TGCTGCAGAT GCGGGGCCAG GGGGCCGGAG AGCCGCCTGC TTGAGTTCTA 3 60 

CCTCGCCATG CCTTTCGCGA CACCCATGGA AGCAGAGCTG GCCCGCAGGA GCCTGGCCCA 420 

25 GGATGCCCCA CCGCTTCCCG TGCCAGGGGT GCTTCTGAAG GAGTTCACTG TGTCCGGCAA 480 

CATACTGACT ATCCGACTGA CTGCTGCAGA CCACCGCCAA CTGCAGCTCT CCATCAGCTC 540 

CTGTCTCCAG CAGCTTTCCC TGTTGATGTG GAT CACGCAG TGCTTTCTGC CCGTGT TTTT 600 

GGCTCAGCCT CCCTCAGGGC AGAGGCGCTA AGCCCAGCCT GGCGCCCCTT CCTAGGTCAT 660 

GCCTCCTCCC CTAGGGAATG GTCCCAGCAC GAGTGGCCAG TTCATTGTGG GGGCCTGATT 720 

30 GTTTGTCGCT GGAGGAGGAC GGCTTACATG TTTGTTTCTG TAGAAAATAA AACTGAGCTA 

Seq ID NO: 587 Protein sequence 
Protein Accession #: NP_001318.1 

35 1 11 21 31 41 51 

I I I I 1 1 

MQAEGRGTGG STGDADGPGG PG I PDGPGGN AGGPGEAGAT GGRGPRGAGA ARASGPGGGA 60 
PRGPHGGAAS GLNGCCRCGA RGPESRLLEF YLAMPFATPM EAELARRSLA QDAPPLPVPG 120 
VLLKEFTVSG NILTIRLTAA DHRQLQLSIS SCLQQLSLLM WITQCFLPVF LAQPPSGQRR 



Seq ID NO: 588 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 52.. 459 



45 1 11 21 31 41 51 

I I I I I I 

CCTCGTGGGC CCTGACCTTC TCTCTGAGAG CCGGGCAGAG GCTCCGGAGC CATGCAGGCC 60 

GAAGGCCAGG GCACAGGGGG TTCGACGGGC GATGCTGATG GCCCAGGAGG CCCTGGCATT 12 0 

CCTGATGGCC CAGGGGGCAA TGCTGGCGGC CCAGGAGAGG CGGGTGCCAC GGGCGGCAGA 180 

50 GGTCCCCGGG GCGCAGGGGC AGCAAGGGCC TCGGGGCCGA GAGGAGGCGC CCCGCGGGGT 240 

CCGCATGGCG GTGCCGCTTC TGCGCAGGAT GGAAGGTGCC CCTGCGGGGC CAGGAGGCCG 300 

GACAGCCGCC TGCTTCAGTT CCGACTGACT GCTGCAGACC ACCGCCAACT GCAGCTCTCC 360 

ATCAGCTCCT GTCTCCAGCA GCTTTCCCTG TTGATGTGGA TCACGCAGTG CTTTCTGCCC 420 

GTGTTTTTGG CTCAGGCTCC CTCAGGGCAG AGGCGCTAAG CCCAGCCTGG CGCCCCTTCC 480 

55 TAGGTCATGC CTCCTCCCCT AGGGAATGGT CCCAGCACGA GTGGCCAGTT CATTGTGGGG 540 

GCCTGATTGT TTGTCGCTGG AGGAGGACGG CTTACATGTT TGTTTCTGTA GAAAATAAAG 600 
CTGAGCTA 

Seq ID NO: 589 Protein sequence 
60 Protein Accession #: Eos sequence 

1 11 21 31 41 51 

1 1 I 1 I I 

MQAEGQGTGG STGDADGPGG PG I PDGPGGN AGGPGEAGAT GGRGPRGAGA ARASGPRGGA 60 

65 PRGPHGGAAS AQDGRCPCGA RRPDSRLLQF RLTAADHRQL QLSISSCLQQ LSLLMWITQC 120 
FLPVFLAQAP SGQRR 

Seq ID NO: 590 DNA sequence 
Nucleic Acid Accession ft: NM_005562.1 
70 Coding sequence: 90.. 3671 

1 11 21 31 41 51 

I I I I I I 

ACAGCGGAGC GCAGAGTGAG AACCACCAAC CGAGGCGCCG GGCAGCGACC CCTGCAGCGG 60 

75 AGACAGAGAC TGAGCGGCCC GGCACCGCCA TGCCTGCGCT CTGGCTGGGC TGCTGCCTCT 12 0 

GCTTCTCGCT CCTCCTGCCC GCAGCCCGGG CCACCTCCAG GAGGGAAGTC TGTGATTGCA 180 

ATGGGAAGTC CAGGCAGTGT ATCTTTGATC GGGAACTTCA CAGACAAACT GGTAATGGAT 240 

TCCGCTGCCT CAACTG CAAT GACAACACTG ATGGCATTCA CTGCGAGAAG TGCAAGAATG 30 0 

GCTTTTACCG GCACAGAGAA AGGGACCGCT GTTTGCCCTG CAATTGTAAC TCCAAAGGTT 360 

80 CTCTTAGTGC TCGATGTGAC AACTCTGGAC GGTGCAGCTG TAAACCAGGT GTGACAGGAG 420 

CCAGATGCGA CCGATGTCTG CCAGGCTTCC ACATGCTCAC GGATGCGGGG TGCACCCAAG 480 

ACCAGAGACT GCTAGACTCC AAGTGTGACT GTGACCCAGC TGGCATCGCA GGGCCCTGTG 540 

ACGCGGGCCG CTGTGTCTGC AAGCCAGCTG TTACTGGAGA ACGCTGTGAT AGGTGTCGAT 600 

CAGGTTACTA TAATCTGGAT GGGGGGAACC CTGAGGGCTG TACCCAGTGT TTCTGCTATG 660 

85 GGCATTCAGC CAGCTGCCGC AGCTCTGCAG AATACAGTGT CCATAAGATC ACCTCTACCT 720 

TTCATCAAGA TGTTGATGGC TGGAAGGCTG TCCAACGAAA TGGGTCTCCT GCAAAGCTCC 780 

AATGGT CACA GCGCCATCAA GATGTGTTTA GCTCAGCCCA ACGACTAGAC CCTGTCTATT 840 



414 



WO 02/086443 

TTGTGGCTCC TGCCAAATTT CTTGGGAATC AACAGGTGAG CTATGGGCAA AGCCTGTCCT 90 0 

TTGACTACCG TGTGGACAGA GGAGGCAGAC ACCCATCTGC CCATGATGTG ATTCTGGAAG 960 

GTGCTGGTCT ACGGAT CACA GCTCCCTTGA TGCCACTTGG CAAGACACTG CCTTGTGGGC 1020 

TCACCAAGAC TTACACATTC AGGTTAAATG AGCATCCAAG CAATAATTGG AGCCCCCAGC 1080 

TGAGTT ACT T TGAGTATCGA AGGTTACTGC GGAATCTCAC AGCCCTCCGC ATCCGAGCTA 1140 

CATATGGAGA ATACAGTACT GGGTACATTG ACAATGTGAC CCTGATTTCA GCCCGCCCTG 1200 

TCTCTGGAGC CCCAGCACCC TGGGTTGAAC AGTGTATATG TCCTGTTGGG TACAAGGGGC 1260 

' AATTCTGCCA GGATTGTGCT TCTGGCTACA AGAGAGATTC AGCGAGACTG GGGCCTTTTG 1320 

GCACCTGTAT TCCTTGTAAC TGTCAAGGGG GAGGGGCCTG TGATCCAGAC ACAGGAGATT 13 80 

GTTATTCAGG GGATGAGAAT CCTGACATTG AGTGTGCTGA CTGCCCAATT GGTTTCTACA 1440 

ACGATCCGCA CGACCCCCGC AGCTGCAAGC CATGTCCCTG TCATAACGGG TTCAGCTGCT 1500 

CAGTGATGCC GGAGACGGAG GAGGTGGTGT GCAATAACTG CCCTCCCGGG GTCACCGGTG 1560 

CCCGCTGTGA GCTCTGTGCT GATGGCTACT TTGGGGACCC CTTTGGTGAA CATGGCCCAG 1620 

TGAGGCCTTG TCAGCCCTGT CAATGCAACA ACAATGTGGA CCCCAGTGCC TCTGGGAATT 1680 

GTGACCGGCT GACAGGCAGG TGTTTGAAGT GTATCCACAA CACAGCCGGC ATCTACTGCG 1740 

ACCAGTGCAA AGCAGGCTAC TTCGGGGACC CATTGGCTCC CAACCCAGCA GACAAGTGTC 1800 

GAGCTTGCAA CTGTAACCCC ATGGGCTCAG AGCCTGTAGG ATGTCGAAGT GATGGCACCT 1860 

GTGTTTGCAA GCCAGGATTT GGTGGCCCCA ACTGTGAGCA TGGAGCATTC AGCTGTCCAG 1920 

CTTGCTATAA TCAAGTGAAG ATT CAGATGG ATCAGTTTAT GCAGCAGCTT CAGAGAATGG 1980 

AGGCCCTGAT TTCAAAGGCT CAGGGTGGTG ATGGAGTAGT ACCTGATACA GAGCTGGAAG 2040 

GCAGGATGCA GCAGGCTGAG CAGGCCCTTC AGGACATTCT GAGAGATGCC CAGATTTCAG 2100 

AAGGTGCTAG CAGAT CCCTT GGTCTCCAGT TGGCCAAGGT GAGGAGCCAA GAGAACAGCT 2160 

ACCAGAGCCG CCTGGATGAC CTCAAGATGA CTGTGGAAAG AGTTCGGGCT CTGGGAAGTC 2220 

AGTACCAGAA CCGAGTTCGG GATACTCACA GGCTCATCAC TCAGATGCAG CTGAGCCTGG 22 80 

CAGAAAGTGA AGCTTCCTTG GGAAACACTA ACATTCCTGC CTCAGACCAC TACGTGGGGC 2340 

CAAATGGCTT TAAAAGTCTG GCTCAGGAGG CCACAAGATT AGCAGAAAGC CACGTTGAGT 2400 

CAGCCAGTAA CATGGAGCAA CTGACAAGGG AAACTGAGGA CTATTCCAAA CAAGCCCTCT 2460 

CACTGGTGCG CAAGGCCCTG CATGAAGGAG TCGGAAGCGG AAGCGGTAGC CCGGACGGTG 2520 

CTGTGGTGCA AGGGCTTGTG GAAAAATTGG AGAAAACCAA GTCCCTGGCC CAGCAGTTGA 2580 

CAAGGGAGGC CACTCAAGCG GAAATTGAAG CAGATAGGTC TTATCAGCAC AGTCTCCGCC 2640 

TCCTGGATTC AGTGTCTCGG CTTCAGGGAG TCAGTGATCA GTCCTTTCAG GTGGAAGAAG 2700 

CAAAGAGGAT CAAACAAAAA GCGGATTCAC TCTCAACGCT GGTAACCAGG CATATGGATG 2760 

AGTTCAAGCG TACACAAAAG AAT CTGGGAA ACTGGAAAGA AGAAGCACAG CAGCTCTTAC 2 82 0 

AGAATGGAAA AAGTGGGAGA GAG AAAT C AG ATCAGCTGCT TTCCCGTGCC AATCTTGCTA 2 8 80 

AAAG C AG AG C ACAAGAAGCA CTGAGTATGG GCAATGCCAC TTTTTATGAA GTTGAGAGCA 2 940 

TCCTTAAAAA CCTCAGAGAG TTTGACCTGC AGGTGGACAA CAGAAAAGCA GAAGCTGAAG 3 000 

AAGCCATGAA GAGACTCTCC TACATCAGCC AGAAGGTTTC AGATGCCAGT GACAAGACCC 3 060 

AGCAAGCAGA AAGAGCCCTG GGGAGCGCTG CTGCTGATGC ACAGAGGGCA AAGAATGGGG 3120 

CCGGGGAGGC CCTGGAAATC TCCAGTGAGA TTGAACAGGA GATTGGGAGT CTGAACTTGG 3180 

AAGCCAATGT GACAGCAGAT GGAGCCTTGG CCATGGAAAA GGGACTGGCC TCTCTGAAGA 3240 

GTGAGATGAG GGAAGTGGAA GGAGAGCTGG AAAGGAAGGA GCTGGAGTTT GACACGAATA 3300 

TGGATGCAGT ACAGATGGTG ATTACAGAAG CCCAGAAGGT TGATACCAGA GCCAAGAACG 33 60 

CTGGGGTTAC AATCCAAGAC ACACTCAACA CATTAGACGG CCTCCTGCAT CTGATGGACC 3420 

AGCCTCTCAG TGTAGATGAA GAGGGGCTGG TCTTACTGGA GCAGAAGCTT TCCCGAGCCA 3 480 

AGACCCAGAT CAACAGCCAA CTGCGGCCCA TGATGTCAGA GCTGGAAGAG AGGGCACGTC 3 540 

AG CAGAGGGG CCACCTCCAT TTGCTGGAGA CAAGCATAGA TGGGATTCTG GCTGATGTGA 3 600 

AGAACTTGGA GAACATTAGG GACAACCTGC CCCCAGGCTG CTACAATACC CAGGCTCTTG 3 660 

AGCAACAGTG AAGCTGCCAT AAATATTTCT CAACTGAGGT TCTTGGGATA CAGAT CTCAG 3 720 

GGCTCGGGAG CCATGT CATG TGAGTGGGTG GGATGGGGAC ATTTGAACAT GTTTAATGGG 3 7 80 

TATGCTCAGG TCAACTGACC TGACCCCATT CCTGATCCCA TGGCCAGGTG GTTGTCTTAT 3 840 

TGCACCATAC TCCTTGCTTC CTGATGCTGG GCAATGAGGC AGATAGCACT GGGTGTGAGA 3 900 

ATGATCAAGG ATCTGGACCC CAAAGAATAG ACTGGATGGA AAGACAAACT GCACAGGCAG 3 960 

ATGTTTGCCT CATAATAGTC GTAAGTGGAG TCCTGGAATT TGGACAAGTG CTGTTGGGAT 402 0 

ATAGTCAACT TATTCTTTGA GTAATGTGAC TAAAGGAAAA AACTTTGACT TTGCCCAGGC 40 80 

ATGAAATTCT TCCTAATGTC AGAACAGAGT GCAACCCAGT CACACTGTGG CCAGTAAAAT 4140 

ACTATTGCCT CATATTGTCC TCTGCAAGCT TCTTGCTGAT CAGAGTTCCT CCTACTTACA 4200 

ACCCAGGGTG TGAACATGTT CTCCATTTTC AAGCTGGAAG AAGTGAGCAG TGTTGGAGTG 42 60 

AGGACCTGTA AGGCAGGCCC ATTCAGAGCT ATGGTGCTTG CTGGTGCCTG CCACCTTCAA 432 0 

GTTCTGGACC TGGGCATGAC ATCCTTTCTT TTAATGATGC CATGGCAACT T AGAGAT TGC 43 80 

ATTTTTATTA AAGCATTTCC TACCAGCAAA GCAAATGTTG GGAAAGTATT TACTTTTTCG 4440 

GTTTCAAAGT GATAGAAAAG TGTGGCTTGG GCATTGAAAG AGGTAAAATT CT C TAG AT T T 4500 

ATTAGTCCTA ATTCAATCCT ACTTTTCGAA CACCAAAAAT GATGCG CATC AATGTATTTT 4560 

ATCTTATTTT CTCAATCTCC TCTCTCTTTC CTCCACCCAT AATAAGAGAA TGTTCCTACT 4620 

CACACTTCAG CTGGGTCACA TCCATCCCTC CATT CATCCT TCCATCCATC TTTCCATCCA 4680 

TTACCTCCAT CCATCCTTCC AACATATATT TATTGAGTAC CTACTGTGTG CCAGGGGCTG 4740 

GTGGGACAGT GGTGACATAG TCTCTGCCCT CATAGAGTTG ATTGTCTAGT GAGGAAGACA 4 800 

AGCATTTTTA AAAAATAAAT TTAAACTTAC AAACTTTGTT TGTCACAAGT GGTGTTTATT 4860 

GCAATAACCG CTTGGTTTGC AACCTCTTTG CTCAACAGAA CATATGTTGC AAGACCCTCC 4920 

CATGGGGGCA CTTGAGTTTT GGCAAGGCTG ACAGAGCTCT GGGTTGTGCA CATTTCTTTG 4980 

CATTCCAGCT GTCACTCTGT GCCTTTCTAC AACTGATTGC AACAGACTGT TGAGTTATGA 5040 

TAACACCAGT GGGAATTGCT GGAGGAACCA GAGGCACTTC CACCTTGGCT GGGAAGACTA 5100 

TGGTGCTGCC TTGCTTCTGT ATTTCCTTGG ATTTTCCTGA AAGTGTTTTT AAATAAAGAA 5160 
CAATTGTTAG ATGCC 

Seq ID NO: 591 Protein sequence 
Protein Accession #: NP_005553.1 

I 11 21 31 41 51 

II | I I 1 

MPALWLGCCL CFSLLLPAAR ATSRREVCDC NGKSRQCIFD RELHRQTGNG FRCLNCNDNT 60 

DGIHCEKCKN GFYRHRERDR CLPCNCNSKG SLSARCDNSG RCSCKPGVTG ARCDRCLPGF 120 

HMLTDAGCTQ DQRLLDSKCD CDPAGIAGPC DAGRCVCKPA VTGERCDRCR SGYYNLDGGN 180

PEGCTQCFCY GHSASCRSSA EYSVHKITST FHQDVDGWKA VQRNGSPAKL QWSQRHQDVF 240 

SSAQRLDPVY FVAPAKFLGN QQVSYGQSLS FDYRVDRGGR HPSAHDVILE GAGLRITAPL 3 00 

MPLGKTLPCG LTKTYTFRLN EHPSNNWSPQ LSYFEYRRLL RNLTALRIRA TYGEYSTGYI 360 

DNVTLISARP VSGAPAPWVE QCICPVGYKG QFCQDCASGY KRDSARLGPF GTCIPCNCQG 420 

GGACD PDTGD CYSGDENPDI ECADCPIGFY NDPHDPRSCK PCPCHNGFSC SVMPETEEW 480 
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FGDPFGEHGP 
PLAPNPADKC 
DQFMQQLQRM 
LAKVRSQENS 
NIPASDHYVG 
VGSGSGSPDG 
VSDQSFQVEE 
DQLLSRANLA 
QKVSDASDKT 
AMEKGLASLK 
TLDGLLHLMD 
TSIDGILADV 



VRPCQPCQCN 
RACNCNPMGS 
EALISKAQGG 
YQSRLDDLKM 
PNGFKSLAQE 
AWQGLVEKL 
AKRIKQKADS 
KSRAQEALSM 
QQAERALGSA 
SEMREVEGEL 
QPLSVDEEGL 
KNLENIRDNL 



NNVDPSASGN 
EPVGCRSDGT 
DGWPDTELE 
TVERVRALGS 
ATRLAESHVE 
EKTKSLAQQL 
LSTLVTRHMD 
GNATFYEVES 
AADAQRAKNG 
ERKELEFDTN 
VLLEQKLSRA 
PPGCYNTQAL 



Seq ID NO: 592 DNA sequence 

Nucleic Acid Accession #: AF101051.1 

Coding sequence: 221..856



GAGCAACCTC 
CGACCCAGAG 
GCGGGGCCCA 
ACCTGCCACC 
GCTGTTGGGC 
GCCCCAGTGG 
CGAGGGGCTG 
TGACTCCTTG 
CATCCTCCTG 
CTTGGAAGAC 
TCTTGCAGGT 
ATTCTATGAC 
TGGCTGGGCT 
CCGAAAAACA 
GAAAGACTAC 
GGACATTGAG 
GTATGGTATT 
AAACATGGCT 
TTGTATTACT 
TATATATAGA 
CTCATTATGT 
CCATATTGAT 
CAGTCAAATA 
CTAATTTACC 
TTATTTTTTA 
TTTCATTGGT 
AGCCAAGAAG 
GTGATAAATT 
TTTGCTTTGA 
CACAACTTTA 
ACCTTTTTGT 
TATATCTTCC 
GATAATCTGG 
TCTTTTTTCT 
AATATTAATT 
TTTATTTGCT 
CTTCATGTGA 
ACACATACCT 
AAACCTACGC 
ATTCTTTCAG 
TTTCCAGTCT 
GCACTGGTGT 
AGCAAGGCAT 
CTGATCTTCC 
GTGGTTTTGT 
CGTTTTGGTG 
GCCTTAACCA 
AAGATTCTGA 
ACAGATGTAA 
TTTTGAATCA 
TGTTAGCTGG 
CTACACAAGG 
TGCCTTCCAA 
ATACATAGAT 
ACAAAAAAAT 
TTTGATCTTT 
TTATAATGGG 
AAAAGGAAAA 



11 

I 

AGCTTCTAGT 
CTTCTCCAGC 
GCCACCTTCG 
CCTGAGCCAG 
TTCATTCTCG 
AGGATTTACT 
TGGATGTCCT 
CTGAATCTGA 
GGAGTGATAG 
GATGAGGTGC 
CTGGCTATTT 
CCTATGACCC 
GCTGCTTCTC 
ACCTCTTACC 
GTGTGACACA 
ATACTATCAT 
ACAAAACAAA 
TAATCTTATT 
GCTTCCCATT 
TATGTATATA 
TGATACTAGC 
GAAGATGTTT 
TCATTTACTC 
AAGGATGAAT 
CCATAATCTT 
CTCTATCTCC 
AATTTATTAC 
CCTGTTGACC 
AAATATTTGT 
TTGATTGAAT 
TCCGCATTCC 
TAATAAGGTG 
TGACAAATAT 
ATCTGCCAAA 
AGTTTATATT 
CAGCTGGCTG 
TTCACTGCCT 
TCATGTGGTT 
ACATACCTTC 
CTGTGTCTGA 
GTACAGAATG 
CTGGAGACCT 
TTGGCTGCTG 
CACCTCACAG 
AATTTGAAAA 
TTGCTTTTCA 
GTCTCTCAAG 
GGAAGTCTTA 
TGGGAAGAAA 
TAATAACTCA 
CAGCTGACGC 
AAAGTCAGCC 
ACCTGAGAAT 
CTTCATGATG 
TTTATGGCCC 
TTATATTCTT 
AATTTGTATA 
AAAAAAAAAA 



21 
I 

AT CCAGACTC 
GGCGGCGCAG 
GGAGTCCGGG 
CGCGGGCGCC 
CCTTCCTGGG 
CCTATGCCGG 
GCGTGTCGCA 
GCAG CACATT 
CAATCTTTGT 
AGAAGATGAG 
TAGTTGCCAC 
CAGTCAATGC 
TCTGCCTTCT 
CAACACCAAG 
GAGGCAAAAG 
TAACATTAGG 
CAAACAAACA 
TTATCTTCTT 
GAGTAATCAT 
TACATGTTTT 
ATACTTAAAA 
ATTGGTATAT 
TTCTTCATTA 
TCTTTCAATT 
ATAGCACTTG 
TGAATCTAAC 
AAATCAGAAC 
TTCCCACACA 
CCAATTGAGT 
TTTTAAGCTA 
TTAATTGTAT 
TGGTCTGTTT 
TCTCTCTGTA 
TTGAGATAAT 
ACTCTCATTC 
AGACACTGAA 
TCCTCTCTCT 
CAGTGCCTTC 
ATGTGGCTCA 
CATGTTTGTG 
CTATTTCACT 
GGATTTGAGT 
TAAGCTTATT 
TGATGTTGTG 
GTGCTATACT 
AATGTTTGAA 
TGATGAGACA 
TCTTCTGCAG 
TAAAAGCCTA 
TAAGGTGCTA 
TGCTAGGATA 
ACCGTGTCTT 
ATATG CTTTT 
TGTGAGTGTA 
AAAATGACCA 
CTACCACACC 
AAGCATTACT 
AAA 



31 

! 

CAGCGCCGCC 

CGAGCAGGGC 

TTGCCCACCT 

CGAGCGAGTC 

ATGGATCGGC 

CGACAACATC 

GAGCACCGGG 

GCAAGCAACC 

GGCCACCGTT 

GATGGCTGTC 

AGCATGGTAT 

CAGGTACGAA 

GGGAGGTGCC 

GCCCTATCCA 

GAGAAAATCA 

ACCTTAGAAT 

AAAAACCCAT 

TCCT CAAT AT 

ACTCAAATGG 

TCTATTAAAA 

TATCTCTAAA 

TTTCTTTTTC 

GCTTTGGGTG 

CTTCATGCGT 

CATCGTTATT 

ACATTTCATA 

TTTGGAGGCA 

ATCCCTGTAC 

AGCTGCATGC 

CTTATTCATA 

TGTTTTCCCA 

GTCTGAACAA 

GCTGTAAGCA 

GATACTTAAC 

TTTGAACATG 

GAAGTCACTG 

ACCAGTCTAT 

CTCTCTCTAC 

GTGCCTTCCT 

CTCTGTTCCA 

TGAGCAAGAT 

CTTGGTGCTA 

GCTTCATCTG 

GGGAT CCAGT 

AAGGGAAAGA 

AATAAAAAAA 

GTGAAGTAAA 

TGAGTATGGC 

CGTGTTGGTA 

TCTGTTCAGT 

GTTAGTTTGG 

ATGAGGAATT- 

GGAAGTTAAA 

ATTCCATGTG 

ACGAAATTGT 

TGGAAACAGA 

CTTTT T CAAT 



41 

I 

CCGGGCGCGG 
TCCCCGCCTT 
GCAAACTCTC 
ATGGCCAACG 
GCCATCGTCA 
GTGACCGCCC 
CAGAT CCAGT 
CGTGCCTTGA 
GGCATGAAGT 
ATTGGGGGTG 
GGCAATAGAA 
TTTGGTCAGG 
CTACTTTGCT 
AAACCTGCAC 
TGTTGAAACA 
TTTGGGTATT 
GTGTTAAAAT 
AGGAGGGAAG 
GGGAAGGGGT 
ATAGACAGTA 
ATAGGTAAAT 
GTCCTTATAT 
CCTTTGCCAC 
GCCCTTTTCA 
AAGCCCTTAT 
GCCTACATTT 
AATCTTTCTG 
TCTGACCCAT 
TGTTCCCCCA 
GTTTTATATC 
AGTGTAATTA 
AGTGCTAGAC 
AGTCACTTAA 
CAGTTAGAAG 
AACTATGCCT 
AACAAAACCT 
TTCCACTGAA 
CAGTCTATTT 
CTCTCTACCA 
TTTTAACAAC 
GATGTATGGA 
TCAATCACCG 
TAAGCGGTGG 
GAGATAGAAT 
ATTGAGGAAT 
TGTTAAGAAA 
ATTGAGTGCA 
CCAATGCTTT 
AAT C CAACAG 
GATGCCCTCA 
AAATGGTACT 
GGACCTAATA 
ATTTAAATGG 
GATATCAGTT 
TACAATAGAA 
CCAATAGACA 
AAATTGTTTT 



CDRLTGRCLK 


540 


CVCKPGFGGP 


S* r\ r\ 

600 


GRMQQAEQAL 


660 


QYQNRVRDTH 


720 


SASNMEQLTR 


780 


TREATQAEIE 


840 


EFKRTQKNLG 


900 


ILKNLREFDL 


960 


AGEALEISSE 


1020 


MDAVQMVITE 


1080 


KTQINSQLRP 


1140 


EQQ 




51 
i 




1 

ACCCCAACCC 


60 


AACTTCCTCC 


120 


CGCCTTCTGC 


180 


CGGGGCTGCA 


240 


GCACTGCCCT 


300 


AGGCCATGTA 


360 


GCAAAGTCTT 


420 


TGGTGGTTGG 


480 


GT AT G AAGTG 


540 


CGATATTTCT 


600 


TCGTT C AAGA 


660 


CTCTCTTCAC 


r*t n a 

720 


GTTCCTGTCC 


780 


CTTCCAGCGG 


840 


AACCGAAAAT 


r> f\ r\ 

900 


GTAATCTGAA 


960 


ACTCAGTGCT 


1020 


ATTTTACCAT 


1080 


GCTCCTTAAA 


1140 


AAATACTATT 


1200 


GTATTTAATT 


1260 


ACATATGTAA 


1320 


AAGACCTAGC 


1380 


TATACTTATT 


1440 


TTGTTTTGTG 


1500 


TAGTTTCTAA 


1560 


CATGACCAAA 


1620 


AGCACTCTTG 


1680 


GGTGTTGTAA 


1740 


CCCCTAAACT 


1800 


TCATGCGTTT 


1860 


TTTCTGGAGT 


1920 


TCTTTCTACC 


1980 


AGGTAGTGTG 


2040 


ATGTAGTGTC 


2100 


ACACACGTAC 


2160 


CAAAACCTAC 


2220 


CCACTGAACA 


2280 


GTCTATTTCC 


2340 


TGCTCTTACT 


2400 


AAGGGTGTTG 


2460 


TCTGTGTTTG 


2520 


TTTGTAATTC 


2580 


ACATGTAAGT 


2640 


TAACTGCATA 


2700 


TGGGTTTCTT 


2760 


CTAAACGAAT 


2820 


CTGTGGCTAA 


r^i n A 

2880 


CAAGGGAGAT 


2940 


GAGCTCTTGC 


3000 


T CAT AAT AAA 


3060 


AATTTTAGTG 


3120 


CTTTTGCCAC 


3180 


ACCAAACATT 


3240 


TTTATCCAAT 


3300 


TTTTGGGGTT 


3360 


TTAATTTAAA 


3420 



85 



Seq ID NO: 593 Protein sequence 
Protein Accession #: AAD16433.1 

1 11 21 31 41 51 

1 I I I I I 

MANAGLQLLG FILAFLGWIG AIVSTALPQW RIYSYAGDNI VTAQAMYEGL WMSCVSQSTG 

QIQCKVFDSL LNLSSTLQAT RALMWG ILL GVIAIFVATV GMKCMKCLED DEVQKMRMAV 

IGGAIFLLAG LAILVATAWY GNRIVQEFYD PMTPVNARYE FGQALFTGWA AASLCLLGGA

LLCCSCPRKT TSYPTPRPYP KPAPSSGKDY V



60 
120 
180 
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Seq ID NO: 594 DNA sequence 

Nucleic Acid Accession #: NM_006180.1 

Coding sequence: 352.. 2820 

1 11 21 31 41 51 

I 1 I 1 I I 

CCCCCATTCG CAT CTAAC AA GGAATCTGCG CCCCAGAGAG TCCCGGACGC CGCCGGTCGG 60 

TGCCCGGCGC GCCGGGCCAT GCAGCGACGG CCGCCGCGGA GCTCCGAGCA GCGGTAGCGC 120 

10 CCCCCTGTAA AGCGGTTCGC TATGCCGGGA CCACTGTGAA CCCTGCCGCC TGCCGGAACA 180 

CTCTTCGCTC CGGACCAGCT CAGCCTCTGA TAAGCTGGAC TCGGCACGCC CGCAACAAGC 240 

ACCGAGGAGT TAAGAGAGCC GCAAGCGCAG GGAAGGCCTC CCCGCACGGG TGGGGGAAAG 3 00 

CGGCCGGTGC AGCGCGGGGA CAGGCACTCG GGCTGGCACT GGCTGCTAGG GATGTCGTCC 3 60 

TGGATAAGGT GGCATGGACC CGCCATGGCG CGGCTCTGGG GCTTCTGCTG GCTGGTTGTG 42 0 

15 GGCTTCTGGA GGGCCGCTTT CGCCTGTCCC ACGTCCTGCA AATGCAGTGC CTCTCGGATC 480 

TGGTGCAGCG ACCCTTCTCC TGGCATCGTG GCATTTCCGA GATTGGAGCC TAACAGTGTA 540 

GATCCTGAGA ACATCACCGA AATTTTCATC GCAAACCAGA AAAGGT TAG A AAT CAT CAAC 600 

GAAGATGATG TTGAAGCTTA TGTGGGACTG AGAAAT CTGA CAAT TGTGG A TTCTGGATTA 660 

AAATTTGTGG CTCATAAAGC ATTTCTGAAA AACAGCAACC TGCAGCACAT CAATTTTACC 720 

20 CGAAACAAAC TGACGAGTTT GTCTAGGAAA CATTTCCGTC ACCTTGACTT GTCTGAACTG 780 

ATCCTGGTGG GCAATCCATT TACATGCTCC TGTGACATTA TGTGGATCAA GACTCTCCAA 840 

GAGGCTAAAT CCAGTCCAGA CACTCAGGAT TTGTACTGCC TGAATGAAAG CAGCAAGAAT 90 0 

ATTCCCCTGG CAAACCTGCA GATACCCAAT TGTGGTTTGC CATCTGCAAA TCTGGCCGCA 960 

CCTAACCTCA CTGTGGAGGA AGGAAAGTCT AT CACATTAT CCTGTAGTGT GGCAGGTGAT 102 0 

25 CCGGTTCCTA ATATGTATTG GGATGTTGGT AACCTGGTTT CCAAACATAT GAATGAAACA 1080 

AGCCACACAC AGGGCTCCTT AAGGATAACT AACATTTCAT CCGATGACAG TGGGAAGCAG 1140 

ATCTCTTGTG TGGCGGAAAA TCTTGTAGGA GAAGATCAAG ATTCTGTCAA CCTCACTGTG 1200 

CATTTTGCAC CAAC TAT C AC ATTTCTCGAA TCTCCAACCT CAGACCACCA CTGGTGCATT 12 60 

CCATTCACTG TGAAAGGCAA CCCCAAACCA GCGCTTCAGT GGTTCTATAA CGGGGCAATA 1320 

30 TTGAATGAGT CCAAATACAT CTGTACTAAA ATACATGTTA CCAATCACAC GGAGTACCAC 1380 

GGCTGCCTCC AGCTGGATAA TCCCACTCAC ATGAACAATG GGGACTACAC TCTAATAGCC 1440 

AAGAATGAGT ATGGGAAGGA TGAGAAACAG ATTTCTGCTC ACTT CATGGG CTGGCCTGGA 1500 

ATTGACGATG GTGCAAACCC AAATTATCCT GATGTAATTT ATGAAGATTA TGGAACTGCA 1560 

GCGAATGACA TCGGGGACAC CACGAACAGA AGTAATGAAA TCCCTTCCAC AG ACGT CACT 1620 

35 GATAAAACCG GTCGGGAACA TCTCTCGGTC TATGCTGTGG TGGTGATTGC GTCTGTGGTG 1680 

GGATTTTGCC TTTTGGTAAT GCTGTTTCTG CTTAAGTTGG CAAG AC ACT C CAAGTTTGGC 1740 

ATGAAAGGCC CAGCCTCCGT TATCAGCAAT GATGATGACT CTGCCAGCCC ACTCCATCAC 180 0 

ATCTCCAATG GGAGTAACAC TCCATCTTCT TCGGAAGGTG GCCCAGATGC TGTCATTATT 1860 

GGAATGACCA AGATCCCTGT CATTGAAAAT CCCCAGTACT TTGGCAT C AC CAACAGTCAG 1920 

40 CTCAAGCCAG ACACATTTGT TCAGCACATC AAGCGACATA ACATTGTTCT GAAAAGGGAG 1980 

CTAGGCGAAG GAGCCTTTGG AAAAGTGTTC CTAGCTGAAT GCTATAACCT CTGTCCTGAG 2040 

CAGGACAAGA TCTTGGTGGC AGTGAAGACC CTGAAGGATG CCAGTGACAA TGCACGCAAG 2100 

GACTTCCACC GTGAGGCCGA GCTCCTGACC AACCTCCAGC ATGAGCACAT CGTCAAGTTC 2160 

TATGGCGTCT GCGTGGAGGG CGACCCCCTC AT CATGGT CT TTGAGTACAT GAAGCATGGG 222 0 

45 GACCTCAACA AGTTCCTCAG GGCACACGGC CCTGATGCCG TGCTGATGGC TGAGGGCAAC 2280 

CCGCCCACGG AACTGACGCA GTCGCAGATG CTGCATATAG CCCAGCAGAT CGCCGCGGGC 2340 

ATGGTCTACC TGGCGTCCCA GCACTTCGTG CACCGCGATT TGGCCACCAG GAACTGCCTG 2400 

GTCGGGGAGA ACTTGCTGGT GAAAATCGGG GACTTTGGGA TGTCCCGGGA CGTGTACAGC 2460 

ACTGACTACT ACAGGGTCGG TGGCCACACA ATGCTGCCCA TTCGCTGGAT GCCTCCAGAG 2520 

50 AGCATCATGT ACAGGAAATT CACGACGGAA AGCGACGTCT GGAGCCTGGG GGTCGTGTTG 2580 

TGGGAGATTT TCACCTATGG CAAACAGCCC TGGTACCAGC TGTCAAACAA TGAGGTGATA 2 640 

GAGTGTATCA CTCAGGGCCG AGTCCTGCAG CGACCCCGCA CGTGCCCCCA GGAGGTGTAT 2 70 0 

GAG CTGATGC TGGGGTGCTG GCAGCGAGAG CCCCACATGA GGAAGAACAT CAAGGGCATC 2760 

CATACCCTCC TTCAGAACTT GGCCAAGGCA TCTCCGGTCT ACCTGGACAT T CT AGGCT AG 2820 

55 GGCCCTTTTC CCCAGACCGA TCCTTCCCAA CGTACTCCTC AGACGGGCTG AGAGGATGAA 2880 

CATCTTTTAA CTGCCGCTGG AGGCCACCAA GCTGCTCTCC TTCACTCTGA CAGTATTAAC 2 940 

ATCAAAGACT CCGAGAAGCT CT CGAGGGAA GCAGTGTGTA CTTCTTCATC CATAGACACA 3000 

GTATTGACTT CTTTTTGGCA TTATCTCTTT CTCTCTTTCC ATCTCCCTTG GTTGTTCCTT 3060 

TTTCTTTTTT TAAATTTTCT TTTTCTTCTT TTTTTTCGTC TTCCCTGCTT CACGATTCTT 3120 

60 ACCCTTTCTT TTGAAT CAAT CTGGCTTCTG CATTACTATT AACTCTGCAT AGACAAAGGC 3180 

CTTAACAAAC GTAATTTGTT ATATCAGCAG ACACTCCAGT TTGCCCACCA CAACTAACAA 3240 

TGCCTTGTTG TATTCCTGCC TTTGATGTGG ATGAAAAAAA GGGAAAACAA ATATTTCACT 33 00 

TAAACTTTGT CACTTCTGCT GTACAGATAT CGAGAGTTTC TATGGATTCA CTTCTATTTA 33 60 

TTTAT TATTA TTACTGTTCT TATTGTTTTT GGATGGCTTA AGCCTGTGTA TAAAAAAGAA 3 420 

65 AACTTGTGTT CAATCTGTGA AGCCTTTATC TATGGGAGAT TAAAACCAGA GAGAAAGAAG 3480 

ATTTATTATG AACCGCAATA TGGGAGGAAC AAAGACAACC ACTGGGATCA GCTGGTGTCA 3540 

GTCCCTACTT AGGAAATACT CAGCAACTGT TAGCTGGGAA GAATGTATTC GGCACCTTCC 3600 

CCTGAGGACC TTTCTGAGGA GTAAAAAGAC TACTGGCCTC TGTGCCATGG ATGATTCTTT 3 660 
TCCCATCACC AGAAATGATA GCGTGCAGTA GAG AG C AAAG ATGGCTT 



70 



Seq ID NO: 595 Protein sequence 
Protein Accession #: NP_006171.1



„ 1 11 21 31 41 51 

75 | I | | | I 

MSSWIRWHGP AMARLWGFCW LVVGFWRAAF ACPTSCKCSA SRIWCSDPSP GIVAFPRLEP 60

NSVDPENITE IFIANQKRLE IINEDDVEAY VGLRNLTIVD SGLKFVAHKA FLKNSNLQHI 120

NFTRNKLTSL SRKHFRHLDL SELILVGNPF TCSCDIMWIK TLQEAKSSPD TQDLYCLNES 180

SKNIPLANLQ IPNCGLPSAN LAAPNLTVEE GKSITLSCSV AGDPVPNMYW DVGNLVSKHM 240 

80 NETSHTQGSL RITNI SSDDS GKQISCVAEN LVGEDQDSVN LTVHFAPTIT FLESPTSDHH 300 

WCIPFTVKGN PKPALQWFYN GAILNESKYI CTKIHVTNHT EYHGCLQLDN PTHMNNGDYT 360 

LIAKNEYGKD EKQISAHFMG WPGIDDGANP NYPDVIYEDY GTAANDIGDT TNRSNEIPST 420 

DVTDKTGREH LSVYAWVIA SWGFCLLVM LFLLKLARHS KFGMKGPASV ISNDDDSASP 480 

LHHI SNGSNT PSSSEGGPDA VIIGMTKIPV IENPQYFGIT NSQLKPDTFV QHIKRHNIVL 540 

85 KRELGEGAFG KVFLAECYNL CPEQDKILVA VKTLKDASDN ARKDFHREAE LLTNLOHEHI 600 

VKFYGVCVEG DPLIMVFEYM KHGDLNKFLR AHGPDAVLMA EGNPPTELTQ SQMLHIAQQI 660 

AAGMVYLASQ HFVHRDLATR NCLVGENLLV KIGDFGMSRD VYSTDYYRVG GHTMLPIRWM 720 
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WO 02/086443 

PPESIMYRKF TTESDVWSLG WLWEIFTYG KQPWYQLSNN EVIECITQGR VLQRPRTCPQ 
EVYELMLGCW QREPHMRKNI KGIHTLLQNL AKASPVYLDI LG 

Seq ID NO: 596 DNA sequence 
Nucleic Acid Accession #: AF410899 
Coding sequence: 483.. 2999 



PCT/US02/12476 



780 



75 



1 

1 

GGGAGCAGGA 
GCAGGAGCCT 
TGCATACCGG 
CCGCCGGTCG 
AGCGGTAGCG 
CTGCCGGAAC 
CCGCAACAAG 
GTGGGGGAAA 
GGATGTCGTC 
GGCTGGTTGT 
CCTCTCGGAT 
CTAACAGTGT 
AAATCATCAA 
ATT CTGGATT 
TCAATTTTAC 
TGTCTGAACT 
AGACTCTCCA 
GCAGCAAGAA 
ATCTGGCCGC 
TGGCAGGTGA 
TGAATGAAAC 
GTGGGAAGCA 
ACCTCACTGT 
ACTGGTGCAT 
ACGGGGCAAT 
CGGAGTACCA 
CTCTAATAGC 
GCTGGCCTGG 
ATGGAACTGC 
CAGACGTCAC 
CGTCTGTGGT 
CCAAGTTTGG 
GTGTTGGCCC 
TCTCCAATGG 
GAATGACCAA 
TCAAGCCAGA 
TAGGCGAAGG 
AGGACAAGAT 
ACTTCCACCG 
ATGGCGTCTG 
ACCTCAACAA 
CGCCCACGGA 
TGGTCTACCT 
TCGGGGAGAA 
CTGACTACTA 
GCATCATGTA 
GGGAGATTTT 
AGTGTAT CAC 
AGCTGATGCT 
ATACCCTCCT 
GCCCTTTTCC 
ATCTTTTAAC 
TCAAAGACTC 
TATTGACTTC 
TTCTTTTTTT 
CCCTTTCTTT 
TTAACAAACG 
GCCTTGTTGT 
AAACTTTGTC 
TT ATT AT TAT 
ACTTGTGTTC 
TTTATTATGA 
TCCCTACTTA 
CTGAGGACCT 
CCCATCACCA 
ATGGCGCATA 
TTGTTTCTCA 
ATGTCCAGAG 



11 
I 

GCCTCGCTGG 
GGACCCAGGC 
ACCCCCATTC 
GTGCCCGGCG 
CCCCCCTGTA 
ACTCTTCGCT 
CACCGAGGAG 
GCGGCCGGTG 
CTGGATAAGG 
GGGCTTCTGG 
CTGGTGCAGC 
AGATCCTGAG 
CGAAGATGAT 
AAAATTTGTG 
CCGAAACAAA 
GATCCTGGTG 
AGAGGCTAAA 
TATTCCCCTG 
ACCTAACCTC 
TCCGGTTCCT 
AAGCCACACA 
GATCTCTTGT 
GCATTTTGCA 
TCCATTCACT 
ATTGAATGAG 
CGGCTGCCTC 
CAAGAATGAG 
AATTGACGAT 
AGCGAATGAC 
TGATAAAACC 
GGGATTTTGC 
CATGAAAGAT 
AGCCTCCGTT 
GAGTAACACT 
GATCCCTGTC 
CACATTTGTT 
AGCCTTTGGA 
CTTGGTGGCA 
TGAGGCCGAG 
CGTGGAGGGC 
GTTCCTCAGG 
ACTGACGCAG 
GGCGTCCCAG 
CTTGCTGGTG 
CAGGGTCGGT 
CAGGAAATTC 
CACCTATGGC 
TCAGGGCCGA 
GGGGTGCTGG 
TCAGAACTTG 
CCAGACCGAT 
TGCCGCTGGA 
CGAGAAGCTC 
TTTTTGGCAT 
AAATTTTCTT 
TGAATCAATC 
TAATTTGTTA 
ATTCCTGCCT 
ACTTCTGCTG 
TACTGTTCTT 
AATCTGTGAA 
ACCGCAATAT 
GG AAAT ACT C 
TTCTGAGGAG 
GAAATGATAG 
GTGTGCTCGG 
AGCGCTATCC 
CTCATTTCGG 



21 
I 

CTGCTTCGCT 

GCCGGCGGCG 

GCATCTAACA 

CGCCGGGCCA 

AAGCGGTTCG 

CCGGACCAGC 

TTAAGAGAGC 

CAGCGCGGGG 

TGGCATGGAC 

AGGGCCGCTT 

GACCCTTCTC 

AACATCACCG 

GTTGAAGCTT 

GCT CAT AAAG 

CTGACGAGTT 

GGCAATCCAT- 

TCCAGTCCAG 

GCAAACCTGC 

ACTGTGGAGG 

AATATGTATT 

CAGGGCTCCT 

GTGGCGGAAA 

CCAACTATCA 

GTGAAAGGCA 

TCCAAATACA 

CAGCTGGATA 

TATGGGAAGG 

GGTGCAAACC 

ATCGGGGACA 

GGTCGGGAAC 

CTTTTGGTAA 

TTCTCATGGT 

ATCAGCAATG 

CCATCTTCTT 

ATTGAAAATC 

CAGCACATCA 

AAAGTGTTCC 

GTGAAGACCC 

CTCCTGACCA 

GACCCCCTCA 

GCACACGGCC 

TCGCAGATGC 

CACTTCGTGC 

AAAATCGGGG 

GGCCACACAA 

ACGACGGAAA 

AAACAGCCCT 

GTCCTGCAGC 

CAGCGAGAGC 

GCCAAGGCAT 

CCTTCCCAAC 

GGCCACCAAG 

TCGAGGGAAG 

TATCTCTTTC 

TTTCTTCTTT 

TGGCTTCTGC 

TATCAGCAGA 

TTGATGTGGA 

TACAGATATC 

ATTGTTTTTG 

GCCTTTATCT 

GGGAGGAACA 

AGCAACTGTT 

TAAAAAGACT 

CGTGCAGTAG 

ACACAGTTTT 

ACAGAACCTT 

GGTCAGGTGG 



31 
I 

CGCGCTCTAC 
GGCGTGAGGC 
AGGAATCTGC 
TGCAGCGACG 
CTATGCCGGG 
TCAGCCTCTG 
CGCAAGCGCA 
ACAGGCACTC 
CCGCCATGGC 
TCGCCTGTCC 
CTGGCATCGT 
AAATTTTCAT 
ATGTGGGACT 
CATTTCTGAA 
TGTCTAGGAA 
TTACATGCTC 
ACACTCAGGA 
AGATACCCAA 
AAGG AAAGT C 
GGGATGTTGG 
TAAGGATAAC 
ATCTTGTAGG 
CATTTCTCGA 
ACCCCAAACC 
TCTGTACTAA 
ATCCCACTCA 
ATGAGAAACA 
CAAATTATCC 
CCACGAACAG 
ATCTCTCGGT 
TGCTGTTTCT 
TTGGATTTGG 
ATGATGACTC 
CGGAAGGTGG 
CCCAGTACTT 
AGCGACATAA 
TAGCTGAATG 
TGAAGGATGC 
ACCTCCAGCA 
TCATGGTCTT 
CTGATGCCGT 
TGCATATAGC 
ACCGCGATTT 
ACTTTGGGAT 
TGCTGCCCAT 
GCGACGTCTG 
GGTACCAGCT 
GACCCCGCAC 
CCCACATGAG 
CTCCGGTCTA 
GTACTCCTCA 
CTGCTCTCCT 
CAGTGTGTAC 
TCT CTTTCCA 
TTTTTCGTCT 
ATTACTATTA 
CACTCCAGTT 
TGAAAAAAAG 
GAGAGTTTCT 
GATGGCTTAA 
ATGGG AG AT T 
AAGACAACCA 
AGCTGGGAAG 
ACTGGCCTCT 
AGAGCAAAGA 
GTCTTCGTAG 
TGTCAACTTC 
GAAAGCC 



41 

I 

GCGCTCAGTC 
GCCGGAGCCC 
GCCCCAGAGA 
GCCGCCGCGG 
ACCACTGTGA 
ATAAGCTGGA 
GGGAAGGCCT 
GGGCTGGCAC 
GCGGCTCTGG 
CACGTCCTGC 
GGCATTTCCG 
CGCAAACCAG 
GAGAAATCTG 
AAACAGCAAC 
ACATTTCCGT 
CTGTGACATT 
TTTGTACTGC 
TTGTGGTTTG 
TATCACATTA 
TAACCTGGTT 
TAACATTTCA 
AGAAGATCAA 
ATCTCCAACC 
AGCGCTTCAG 
AATACATGTT 
CATGAACAAT 
GATTTCTGCT 
TGATGTAATT 
AAGTAATGAA 
CTATGCTGTG 
GCTTAAGTTG 
GAAAGTAAAA 
TGCCAGCCCA 
CCCAGATGCT 
TGGCATCACC 
CATTGTTCTG 
CTATAACCTC 
CAGTGACAAT 
TGAGCACATC 
TGAGTACATG 
GCTGATGGCT 
CCAGCAGATC 
GGCCACCAGG 
GTCCCGGGAC 
TCGCTGGATG 
GAGCCTGGGG 
GTCAAACAAT 
GTGCCCCCAG 
GAAGAACATC 
CCTGGACATT 
GACGGGCTGA 
TCACTCTGAC 
TTCTTCATCC 
TCTCCCTTGG 
TCCCTGCTTC 
AC T CTG CAT A 
TGCCCACCAC 
GGAAAACAAA 
ATGGATTCAC 
GCCTGTGTAT 
AAAACCAGAG 
CTGGGATCAG 
AATGTATTCG 
GTGCCATGGA 
TGGCTTCCGT 
GTTGTGATGA 
AGTTGAAAAG 



51 
I 

CCCGGCGGTA 60 

GGCCT CGAGG 120 

GTCCCGGACG 18 0 

AGCTCCGAGC 240 

ACCCTGCCGC 3 00 

CTCGGCACGC 3 60 

CCCCGCACGG 42 0 

TGGCTGCTAG 480 

GGCTTCTGCT 540 

AAATGCAGTG 600 

AGATTGGAGC 660 

AAAAGGTTAG 720 

ACAATTGTGG 780 

CTGCAGCACA 840 

CACCTTGACT 90 0 

ATGTGGATCA 960 

CTGAATGAAA 1020 

CCATCTGCAA 1080 

TCCTGTAGTG 1140 

TCCAAACATA 12 00 

TCCGATGACA 12 60 

GATTCTGTCA 132 0 

TCAGACCACC 13 80 

TGGTTCTATA 1440 

ACCAATCACA 1500 

GGGGACTACA 1560 

CACTTCATGG 162 0 

TATGAAGATT 1680 

ATCCCTTCCA 1740 

GTGGTGATTG 1800 

GCAAGACACT 1860 

TCAAGACAAG 192 0 

CTCCATCACA 1980 

GTCATTATTG 2 040 

AACAGTCAGC 2100 

AAAAGGG AG C 2160 

TGTCCTGAGC 222 0 

GCACGCAAGG 22 80 

GTCAAGTTCT 2 340 

AAGCATGGGG 240 0 

GAGGGCAACC 24 60 

GCCGCGGGCA 2 520 

AACTGCCTGG 2580 

GTGTACAGCA 2640 

CCT CCAGAG A 2 700 

GTCGTGTTGT 2760 

GAGGTGATAG 2 820 

GAGGTGTATG 2880 

AAGGGCATCC 2940 

CTAGGCTAGG 3 000 

GAGGATGAAC 3060 

AGTATTAACA 312 0 

ATAGACACAG 3180 

TTGTTCCTTT 3240 

ACGATTCTTA 3 3 00 

GACAAAGGCC 33 60 

AACTAACAAT 3420 

TATTTCACTT 3480 

TTCTATTTAT 3 540 

AAAAAAGAAA 3 600 

AG AAAGAAGA 3 660 

CTGGTGTCAG 3720 

GCACCTTCCC 3780 

TGATTCTTTT 3840 

GAGACACAAG 3 900 

TAGCACTGGT 3 960 

AGGTGGATTC 4 02 0 



80 



85 



Seq ID NO: 597 Protein sequence 
Protein Accession #: AAL67965.1 

1 11 21 31 41 51 

l I l I I l 

MSSWIRWHGP AMARLWGFCW LVVGFWRAAF ACPTSCKCSA SRIWCSDPSP GIVAFPRLEP 60

NSVDPENITE IFIANQKRLE IINEDDVEAY VGLRNLTIVD SGLKFVAHKA FLKNSNLQHI 120 

NFTRNKLTSL SRKHFRHLDL SELILVGNPF TCSCDIMWIK TLQEAKSSPD TQDLYCLNES 180

SKNIPLANLQ IPNCGLPSAN LAAPNLTVEE GKSITLSCSV AGDPVPNMYW DVGNLVSKHM 240 



418 



WO 02/086443 

NETSHTQGSL RITNISSDDS 
WCIPFTVKGN PKPALQWFYN 
LIAKNEYGKD EKQISAHFMG 
DVTDKTGREH LSVYAVWIA 
VGPASVISND DDSASPLHHI 
KPDTFVQHIK RHNIVLKREL 
FHREAELLTN LQHEHIVKFY 
PTELTQSQML HIAQQIAAGM 
DYYRVGGHTM LPIRWMPPES 
CITQGRVLQR PRTCPQEVYE 



GKQISCVAEN LVGEDQDSVN 
GAILNESKYI CTK I HVTNHT 
WPGIDDGANP NYPDVIYEDY 
SWGFCIiLVM IiFLIiKLARHS 
SNGSNTPSSS EGGPDAVIIG 
GEGAFGKVFL AECYNIiCPEQ 
GVCVEGDPLI MVFEYMKHGD 
VYLASQHFVH RDLATRNCLV 
IMYRKFTTES DVWSLGWLW 
LMLGCWQREP HMRKNIKGIH 



LTVHFAPTIT FLESPTSDHH 
EYHGCLQLDN PTHMNNGDYT 
GTAANDIGDT TNRSNEIPST 
KFGMKDFSWF GFGKVKSRQG 
MTKIPVIENP QYFGITNSQL 
DKI LVAVKTL KDASDNARKD 
LNKFLRAHGP DAVLMAEGNP 
GENLLVKIGD FGMSRDVYST 
EIFTYGKQPW YQLSNNEVIE 
TIiLQNLAKAS PVYLDILG 



Seq ID NO: 598 DNA sequence
Nucleic Acid Accession #: AB052906 
Coding sequence: 74.. 814 



1 11 21 31 41 51 

l I I l I I 

AAAACCTTGA GGTGATTCAT CTTCCAGGCT CTCCTTCCAT CAAGTCTCTC CTCCCTAGCG 
CTCTGGGTCC TTAATGGCAG CAGCCGCCGC TACCAAGATC CTTCTGTGCC TCCCGCTTCT 
GCTCCTGCTG TCCGGCTGGT CCCGGGCTGG GCGAGCCGAC CCTCACTCTC TTTGCTATGA 
CATCACCGTC ATCCCTAAGT TCAGACCTGG ACCACGGTGG TGTGCGGTTC AAGGCCAGGT 
GGATGAAAAG ACTTTTCTTC ACTATGACTG TGGCAACAAG ACAGTCACAC CTGTCAGTCC 
CCTGGGGAAG AAACTAAATG TCACAACGGC CTGGAAAGCA CAGAACCCAG TACTGAGAGA 
GGTGGTGGAC ATACTTACAG AGCAACTGCG TG AC AT T CAG CTGGAGAATT ACACACCCAA 
GGAACCCCTC ACCCTGCAGG CCAGGATGTC TTGTGAGCAG AAAGCTGAAG GACACAGCAG 
TGGATCTTGG CAGTTCAGTT TCGATGGGCA ' GATCTTCCTC CTCTTTGACT CAGAGAAGAG 
AATGTGGACA ACGGTT CAT C CTGGAGCCAG AAAGATGAAA GAAAAGTGGG AGAATGACAA 
GGTTGTGGCC ATGTCCTTCC ATTACTTCTC AATGGGAGAC TGTATAGGAT GGCTTGAGGA 
CTTCTTGATG GGCATGGACA GCACCCTGGA GCCAAGTGCA GGAGCACCAC TCGCCATGTC 
CTCAGGCACA ACCCAACTCA GGGCCACAGC CACCACCCTC ATCCTTTGCT GCCTCCTCAT 
CATCCTCCCC TGCTTCATCC TCCCTGGCAT CTGAGGAGAG TCCTTTAGAG TGACAGGTTA 
AAGCTGATAC CAAAAGGCTC CTGTGAGCAC GGTCTTGATC AAACTCGCCC TTCTGTCTGG 
CCAGCTGCCC ACGACCTACG GTGTATGTCC AGTGGCCTCC AGC AGAT CAT GATGACATCA 
TGGACCCAAT AGCTCATTCA CTGCCTTGAT TCCTTTTGCC AACAATTTTA CCAGCAGTTA 
TACCTAACAT ATTATGCAAT TTTCTCTTGG TGCTACCTGA TGGAATTCCT GCACTTAAAG 
TTCTGGCTGA CTAAACAAGA TATATCATTT TCTTTCTTCT CTTTTTGTTT GGAAAATCAA 
GTACTTCTTT GAATGATGAT CTCTTTCTTG CAAATGATAT TGT CAGTAAA ATAATCACGT 
TAGACTTCAG ACCTCTGGGG ATTCTTTCCG TGT CCTGAAA GAGAATTTTT AAATTATTTA 
ATAAGAAAAA ATTTATATTA ATGAT TGTTT CCTTTAGTAA TTTATTGTTC TGTACTGATA 
TTTAAATAAA GAGTTCTATT TCCCAAAAAA AAAAAAAAAA AA 

Seq ID NO: 599 Protein sequence 
Protein Accession #: BAB61048.1 



1 11 21 

I I i 

MAAAAATKIL LCLPLLLLLS GWSRAGRADP 

FLHYDCGNKT VTPVSPLGKK LNVTTAWKAQ 

LQARMSCEQK AEGHSSGSWQ FSFDGQIFLL 

SFHYFSMGDC IGWLEDFLMG MDSTLEPSAG 
FILPGI 



31 41 51 

I 1 1 

HSLCYDITVI PKFRPGPRWC AVQGQVDEKT 

NPVLREWDI LTEQLRDIQL ENYTPKEPLT 

FDSEKRMWTT VHPGARKMKE KWENDKWAM 

APLAMSSGTT QLRATATTLI LCCLLIILPC 



Seq ID NO: 600 DNA sequence 

Nucleic Acid Accession #: NM_001898.1 

Coding sequence: 57.. 482 



1 11 21 31 41 51 

I I I I I I 

GGCTCTCACC CTCCTCTCCT GCAGCTCCAG CTTTGTGCTC TGCCTCTGAG GAGACCATGG 

CCCAGTATCT GAGTACCCTG CTGCTCCTGC TGGCCACCCT AGCTGTGGCC CTGGCCTGGA 

GCCCCAAGGA GGAGGATAGG ATAATCCCGG GTGGCATCTA TAACGCAGAC CTCAATGATG 

AGTGGGTACA GCGTGCCCTT CACTTCGCCA TCAGCGAGTA TAACAAGGCC ACCAAAGATG 

ACTACTACAG ACGT CCGCTG CGGGTACTAA GAG CCAGG CA ACAGACCGTT GGGGGGGTGA 

ATTACTTCTT CGACGTAGAG GTGGGCCGCA CCATATGTAC CAAGTCCCAG CCCAACTTGG 

ACACCTGTGC CTTCCATGAA CAGCCAGAAC TGCAGAAGAA ACAGTTGTGC TCTTTCGAGA 

TCTACGAAGT TCCCTGGGAG AACAGAAGGT CCCTGGTGAA ATCCAGGTGT CAAGAATCCT 

AGGGATCTGT GCCAGGCCAT TCGCACCAGC CACCACCCAC TCCCACCCCC TGTAGTGCTC 

CCACCCCTGG ACTGGTGGCC CCCACCCTGC GGGAGGCCTC CCCATGTGCC TGCGCCAAGA 

GACAGACAGA GAAGGCTGCA GGAGTCCTTT GTTGCTCAGC AGGGCGCTCT GCCCTCCCTC 

CTTCCTTCTT GCTTCTAATA GCCCTGGTAC ATGGTACACA CCCCCCCACC TCCTGCAATT 

AAACAGTAGC ATCGCC 



Seq ID NO: 601 Protein sequence 
Protein Accession #: NP_001889.1



1 11 21 31 41 51 

l I l l I I 

MAQYLSTLLL LLATLAVALA WSPKEEDRII PGGIYNADLN DEWVQRALHF AISEYNKATK
DDYYRRPLRV LRARQQTVGG VNYFFDVEVG RTICTKSQPN LDTCAFHEQP ELQKKQLCSF
EIYEVPWENR RSLVKSRCQE S



Seq ID NO: 602 DNA sequence 

Nucleic Acid Accession #: NM_003976.2 

Coding sequence: 299..961

1 11 21 31 41 51 



419 



WO 02/086443 

CTCTGAGCTT CTCTGAGCCT 
CATGGAGTTG TGAAAGAATA 
CTACTTCTGC TGGGTTGAGT 
GGGTGGCAGG CCGGTCCCCC 
CAGGAGGGTG GGGGAACAGC 
GGAACTTGGA CTTGGAGGCC 
TGCCCTGTGG CCCACCCTGG 
GGGCTCCGCG CCCCGCAGCC 
CGCCGGCCAC CTGCCGGGGG 
GCCGCCGCAG CCTTCTCGGC 
CGGGGGCCGC GCGGCGCGGG 
GGGCTGCCGC CTGCGCTCGC 
CGACGAGCTG GTGCGTTTCC 
CGACCTCAGC CTGGCCAGCC 
GCCCGTCAGC CAGCCCTGCT 
CAACAGCACC TGGAGAACCG 
AGGGCTCGCT CCAGGGCTTT 
CCTCCCGCAG AGT CCCACTA 
AGGCCCCTAC CGGTGGGTGA 
CAGCCCCAGA GCCCTCACCC 
GGAGCCCTTC GGACCCACTT 
CCCTCCTCTG ATGAACACTA 
ACAGCATTTG AAGGACACAT 
CCTGTACTCA CTCATGGGAG 



TGTTTGCTCA TCTGGAAAAA 
GCTGCAAAGC ACCTAACACA 
CTAGCTGTGT AGGCCCCTTG 
ACAAAAGATA ACTCATCTCT 
TCAACAATGG CTGATGGGCG 
TCTCCACGCT GTCCCACTGC 
CCGCTCTGGC TCTGCTGAGC 
CTGCCCCCCG CGAAGGCCCC 
GACGCACGGC CCGCTGGTGC 
CCGCGCCCCC GCCGCCTGCA 
CTGGGGGCCC GGGCAGCCGC 
AGCTGGTGCC GGTGCGCGCG 
GCTTCTGCAG CGGCTCCTGC 
TACTGGGCGC CGGGGCCCTG 
GCCGACCCAC GCGCTACGAA 
TGGACCGCCT CTCCGCCACC 
GCAGACTGGA CCCTTACCGG 
GCCAGCGGCC TCAGCCAGGG 
TGGAT AT CAT CCCCGAACAG 
TGCGGATCCC AGCCTAAAAG 
CTCACAGACT CTGGCACTGG 
CAGTGGCTGA GGCAT CAGCC 
ATTGCAGTTG CTTGGTTGAA 
CTGGCCCC 



GGGGATTAAA CCATTTACCT 
TAGTAAGGTT CCCAGTGCAG 
TTCCTCACCT GGAGAAACTG 
TAATTTGCAA GCTGCCTCAA 
CTCCTGGTGT TGATAGAGAT 
CCCTGGCCTA GGCGGCAGCC 
AGCGTCGCAG AGGCCTCCCT 
CCGCCTGTCC TGGCGTCCCC 
AGTGGAAGAG CCCGGCGGCC 
CCCCCATCTG CTCTTCCCCG 
GCTCGGGCAG CGGGGGCGCG 
CTCGGCCTGG GCCACCGCTC 
CGCCGCGCGC GCTCTCCACA 
CGACCGCCCC CGGGCTCCCG 
GCGGTCTCCT TCATGGACGT 
GCCTGCGGCT GCCTGGGCTG 
TGGCTCTTCC TGCCTGGGAC 
ACGAAGGCCT CAAAGCTGAG 
GTGAAGGGAC AACTGACTAG 
ACACCAGAGA CCTCAGCTAT 
CCAGGCCTCG AACCTGGGAC 
CCCGCCCAGG CCCTGTAGGG 
AGTGCCTGTG CTGGAACTGG 



Seq ID NO: 603 Protein sequence 
Protein Accession #: NP_003967.1



1 11 21 31 41 51 

I I I l I l 

MELGLGGLST LSHCPWPRRQ PALWPTLAAL ALLSSVAEAS LGSAPRSPAP REGPPPVLAS

PAGHLPGGRT ARWCSGRARR PPPQPSRPAP PPPAPPSALP RGGRAARAGG PGSRARAAGA 

RGCRLRSQLV PVRALGLGHR SDELVRFRFC SGSCRRARSP HDLSLASLLG AGALRPPPGS 

RPVSQPCCRP TRYEAVSFMD VNSTWRTVDR LSATACGCLG 



Seq ID NO: 604 DNA sequence 

Nucleic Acid Accession #: NM_057091.1 

Coding sequence: 783.. 1445 



1 11 

I I 

ACTGGCCGCT GAGAGAAGAA 

GGACCCCCAA ATCTGCACGT 
TCGCTCCCCG CCCTCACTCA 
CGCGTGTCTA CAAACTCAAC 
CTCCATATCC GAGGGGCCCC 
CAAGCTAGGG GGGACTGGAT 
CGGGGCAGGG GCGCTCCCAG 
CACCGGACGG CTGCGGCGGC 
CAGACAAGGC CCGGGGGCTC 
CCCGGGCCTG GAGCCCCACA 
TAAAAGAGGC ACTGCCAGGT 
GCCCAGCACT GGTCCCCGGA 
TCAACAGGAG GGTGGGGGAA 
AGATGGAACT TGGACTTGGA 
AGCCTGCCCT GTGGCCCACC 
CCCTGGGCTC CGCGCCCCGC 
CCCCCGCCGG CCACCTGCCG 
GGCCGCCGCC GCAGCCTTCT 
CCCGCGGGGG CCGCGCGGCG 
CGCGGGGCTG CCGCCTGCGC 
GCTCCGACGA GCTGGTGCGT 
CACACGACCT CAGCCTGGCC 
CCCGGCCCGT CAGCCAGCCC 
ACGTCAACAG CACCTGGAGA 
GCTGAGGGCT CGCTCCAGGG 
GGACCCTCCC GCAGAGTCCC 
TGAGAGGCCC CTACCGGTGG 
CTAGCAGCCC CAGAGCCCTC 
CTATGGAGCC CTTCGGACCC 
GGACCCCTCC TCTGATGAAC 
AGGGACAGCA TTTGAAGGAC 
CTGGCCTGTA CTCACTCATG 



21 31 

! I 

TCGGGTGGAG CAGAGAGCAG 
ACCAGCAGTC AGCCGCCCCA 
CTTTCTCCCG CCCTCGGCCC 
TCCCGGTTTC CGTGCCTCTC 
TCCCAGCATC TACCCCCCTC 
CCGACGGGTG GAGCAGCCAG 
CCCCACCCCG GGATCTGGTG 
GGGCAGGAGG CTGCTGAGGG 
CGCCAGCAGC AGGTCCCTCG 
CCCGAGGGTG CAGACTGGCT 
GTACAGTCCT GGGCATGCGC 
AAGGTGCCTA GAAGAACAAG 
CAGCTCAACA ATGGCTGATG 
GGCCTCTCCA CGCTGTCCCA 
CTGGCCGCTC TGGCTCTGCT 
AGCCCTGCCC CCCGCGAAGG 
GGGGGACGCA CGGCCCGCTG 
CGGCCCGCGC CCCCGCCGCC 
CGGGCTGGGG GCCCGGGCAG 
TCGCAGCTGG TGCCGGTGCG 
TTCCGCTTCT GCAGCGGCTC 
AGCCTACTGG GCGCCGGGGC 
TGCTGCCGAC CCACGCGCTA 
ACCGTGGACC GCCTCTCCGC 
CTTTGCAGAC TGGACCCTTA 
ACTAGCCAGC GGCCTCAGCC 
GTGATGGATA TCATCCCCGA 
ACCCTGCGGA TCCCAGCCTA 
ACTTCTCACA GACTCTGGCA 
ACTACAGTGG CTGAGGCATC 
ACATATTGCA GTTGCTTGGT 
GGAGCTGGCC CC 



41 51 

I ! 

CTGCTGCAGG GCAGACAGCC 
CGCAGGGACC GGCTTACCCC 
GGCCTCCCAG CTCTCTACTT 
CACCGCTCGA GTTCTCTACT 
CCAACCTCGG GGGACCTAGC 
GTGAGCCCCG AAAGGTGGGG 
ACGCTGGGGC TGGAATTTGA 
ATGGAGTTGG GCCCGGCCCC 
GGCCCCAGCC CTCGCTGCCA 
GCCAAGGCCA CACTTTTGGC 
TGTTTGAGCT TCGGGGGAGA 
GTGCAGGACC CCGTGCTGCC 
GGCGCTCCTG GTGTTGATAG 
CTGCCCCTGG CCTAGGCGGC 
GAGCAGCGTC GCAGAGGCCT 
CCCCCCGCCT GTCCTGGCGT 
GTGCAGTGGA AGAGCCCGGC 
TGCACCCCCA TCTGCTCTTC 
CCGCGCTCGG GCAGCGGGGG 
CGCGCTCGGC CTGGGCCACC 
CTGCCGCCGC GCGCGCTCTC 
CCTGCGACCG CCCCCGGGCT 
CGAAGCGGTC TCCTTCATGG 
CACCGCCTGC GGCTGCCTGG 
CCGGTGGCTC TTCCTGCCTG 
AGGGACGAAG GCCTCAAAGC 
ACAGGTGAAG GGACAACTGA 
AAAGACACCA GAGACCTCAG 
CTGGCCAGGC CTCGAACCTG 
AGCCCCCGCC CAGGCCCTGT 
TGAAAGTGCC TGTGCTGGAA 



Seq ID NO: 605 Protein sequence 
Protein Accession #: NP_003967.1



1 
I 

MELGLGGLST 
PAGHLPGGRT 
RGCRLRSQLV 
RPVSQPCCRP 



11 
I 

LSHCPWPRRQ 
ARWCSGRARR 
PVRALGLGHR 
TRYEAVSFMD 



21 
I 

PALWPTLAAL 
PPPQPSRPAP 
SDELVRFRFC 
VNSTWRTVDR 



31 
I 

ALLSSVAEAS 
PPPAPPSALP 
SGSCRRARSP 
LSATACGCLG 



41 
1 

LGSAPRSPAP 
RGGRAARAGG 
HDLSLASLLG 



51 
I 

REGPPPVLAS 
PGSRARAAGA 
AGALRPPPGS 



Seq ID NO: 606 DNA sequence 

Nucleic Acid Accession #: NM_057160.1



420 



WO 02/086443 

Coding sequence: 1..714 

1 11 21 31 41 51 

I i l I I I 

ATGCCCGGCC TGATCTCAGC CCGAGGACAG CCCCTCCTTG AGGTCCTTCC TCCCCAAGCC 

CACCTGGGTG CCCTCTTTCT CCCTGAGGCT CCACTTGGTC TCTCCGCGCA GCCTGCCCTG 

TGGCCCACCC TGGCCGCTCT GGCTCTGCTG AGCAGCGTCG CAGAGGCCTC CCTGGGCTCC 

GCGCCCCGCA GCCCTGCCCC CCGCGAAGGC CCCCCGCCTG TCCTGGCGTC CCCCGCCGGC 

CACCTGCCGG GGGGACGCAC GGCCCGCTGG TGCAGTGGAA GAGCCCGGCG GCCGCCGCCG 

CAGCCTTCTC GGCCCGCGCC CCCGCCGCCT GCACCCCCAT CTGCTCTTCC CCGCGGGGGC 

CGCGCGGCGC GGGCTGGGGG CCCGGGCAGC CGCGCTCGGG CAGCGGGGGC GCGGGGCTGC 

CGCCTGCGCT CGCAGCTGGT GCCGGTGCGC GCGCTCGGCC TGGGCCACCG CTCCGACGAG 

CTGGTGCGTT TCCGCTTCTG CAGCGGCTCC TGCCGCCGCG CGCGCTCTCC ACACGACCTC 

AGCCTGGCCA GCCTACTGGG CGCCGGGGCC CTGCGACCGC CCCCGGGCTC CCGGCCCGTC 

AGCCAGCCCT GCTGCCGACC CACGCGCTAC GAAGCGGTCT CCTTCATGGA CGTCAACAGC 

ACCTGGAGAA CCGTGGACCG CCTCTCCGCC ACCGCCTGCG GCTGCCTGGG CTGAGGGCTC 

GCTCCAGGGC TTTGCAGACT GGACCCTTAC CGGTGGCTCT TCCTGCCTGG GACCCTCCCG 

CAGAGTCCCA CTAGCCAGCG GCCTCAGCCA GGGACGAAGG CCTCAAAGCT GAGAGGCCCC 

TACCGGTGGG TGATGGATAT CATCCCCGAA CAGGTGAAGG GACAACTGAC TAGCAGCCCC 

AGAGCCCTCA CCCTGCGGAT CCCAGCCTAA AAGACACCAG AGACCTCAGC TATGGAGCCC 
TTCGGACCCA CTTCTCACAG ACTCTGGCAC TGGCCAGGCC TCGAACCTGG GACCCCTCCT 
CTGATGAACA CTACAGTGGC TG AGG CAT C A GCCCCCGCCC AGGCCCTGTA GGG AC AG CAT 
TTGAAGGACA CATATTGCAG TTGCTTGGTT GAAAGTGCCT GTGCTGGAAC TGGCCTGTAC 

TCACTCATGG GAGCTGGCCC C 



Seq ID NO: 607 Protein sequence 
Protein Accession #: NP_476501.1



1 11 21 31 41 51 

I I I I I I 

MPGLISARGQ PLLEVLPPQA HLGALFLPEA PLGLSAQPAL WPTLAALALL SSVAEASLGS 

APRSPAPREG PPPVLASPAG HLPGGRTARW CSGRARRPPP QPSRPAPPPP APPSALPRGG 

RAARAGGPGS RARAAGARGC RLRSQLVPVR ALGLGHRSDE LVRFRFCSGS CRRARSPHDL 

SLASLLGAGA LRPPPGSRPV SQPCCRPTRY EAVSFMDVNS TWRTVDRLSA TACGCLG 



Seq ID NO: 608 DNA sequence 

Nucleic Acid Accession #: NM_057090.1

Coding sequence: 29.. 715 



1 11 21 31 41 51 

I I I I l I 

CTGATGGGCG CTCCTGGTGT TGATAGAGAT GGAACTTGGA CTTGGAGGCC TCTCCACGCT 
GTCCCACTGC CCCTGGCCTA GGCGGCAGGC TCCACTTGGT CTCTCCGCGC AGCCTGCCCT 
GTGGCCCACC CTGGCCGCTC TGGCTCTGCT GAGCAGCGTC GCAGAGGCCT CCCTGGGCTC 
CGCGCCCCGC AGCCCTGCCC CCCGCGAAGG CCCCCCGCCT GTCCTGGCGT CCCCCGCCGG 
CCACCTGCCG GGGGGACGCA CGGCCCGCTG GTGCAGTGGA AGAGCCCGGC GGCCGCCGCC 
GCAGCCTTCT CGGCCCGCGC CCCCGCCGCC TGCACCCCCA TCTGCTCTTC CCCGCGGGGG 
CCGCGCGGCG CGGGCTGGGG GCCCGGGCAG CCGCGCTCGG GCAGCGGGGG CGCGGGGCTG 
CCGCCTGCGC TCGCAGCTGG TGCCGGTGCG CGCGCTCGGC CTGGGCCACC GCTCCGACGA 
GCTGGTGCGT TTCCGCTTCT GCAGCGGCTC CTGCCGCCGC GCGCGCTCTC CACACGACCT 
CAGCCTGGCC AGCCTACTGG GCGCCGGGGC CCTGCGACCG CCCCCGGGCT CCCGGCCCGT 
CAGCCAGCCC TGCTGCCGAC CCACGCGCTA CGAAGCGGTC TCCTTCATGG ACGT CAACAG 
CACCTGGAGA ACCGTGGACC GCCTCTCCGC CACCGCCTGC GGCTGCCTGG GCTGAGGGCT 
CGCTCCAGGG CTTTGCAGAC TGGACCCTTA CCGGTGGCTC TTCCTGCCTG GGACCCTCCC 
GCAGAGTCCC ACTAGCCAGC GGCCTCAGCC AGGGACGAAG GCCTCAAAGC TGAGAGGCCC 
CTACCGGTGG GTGATGGATA TCATCCCCGA ACAGGTGAAG GGACAACTGA CTAGCAGCCC 
CAGAGCCCTC ACCCTGCGGA TCCCAGCCTA AAAGACACCA GAGACCTCAG CTATGGAGCC 
CTTCGGACCC ACTTCTCACA GACTCTGGCA CTGGCCAGGC CTCGAACCTG GGACCCCTCC 
TCTGATGAAC ACTACAGTGG CTGAGGCATC AGCCCCCGCC CAGGCCCTGT AGGGACAGCA 
TTTGAAGGAC ACATATTGCA GTTGCTTGGT TGAAAGTGCC TGTGCTGGAA CTGGCCTGTA 
CTCACTCATG GGAGCTGGCC CC 



Seq ID NO: 609 Protein sequence 
Protein Accession #: NP_476431.1 

1 11 21 31 41 51 

I I I I I 1 

MELGLGGLST LSHCPWPRRQ APLGLSAQPA LWPTLAALAL LSSVAEASLG SAPRSPAPRE 

GPPPVLASPA GHLPGGRTAR WCSGRARRPP PQPSRPAPPP PAPPSALPRG GRAARAGGPG 
SRARAAGARG CRLRSQLVPV RALGLGHRSD ELVRFRFCSG SCRRARSPHD LSLASLLGAG 

ALRPPPGSRP VSQPCCRPTR YEAVSFMDVN STWRTVDRLS ATACGCLG 



Seq ID NO: 610 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..1746 



1 11 

1 I 
ATGCCACTGA AGCATTATCT 

GCCTACCATG GCTGCCCTAG 

GGGGCACGCA TTGTGGCGGT 

CTCAACACGC ACATCACTGA 

GCCCTGAGGA TTGAGAAGAA 

GGCTCGCTGC GCTATCTCAG 

TTCCAGGGCC TGGACAGCCT 

CAGCCGGCCC ACTTCTCCCA 

CTGGAATACA TCCCTGACGG 



21 31 

1 I 
CCTTTTGCTG GTGGGCTGCC 

CGAGTGTACC TGCTCCAGGG 

GCCCACCCCT CTGCCCTGGA 

ACTCAATGAG TCCCCGTTCC 

TGAGCTGTCG CGCATCACGC 

CCTCGCCAAC AACAAGCTGC 

TGAGTCTCTC CTTCTG TCCA 

GTGCAGCAAC CTCAAGGAGC 

AGCCTTCGAC CACCTGGTAG 



41 51 

I I 
AAGCCTGGGG TGCAGGGTTG 

CCTCCCAGGT GGAGTGCACC 

ACGCCATGAG CCTGCAGATC 

TCAATATCTC AGCCCTCATC 

CTGGGGCCTT CCGAAACCTG 

AGGTTCTGCC CATCGGCCTC 

GTAACCAGCT GTTGCAGATC 

TGCAGTTGCA CGGCAACCAC 

GACTCACGAA GCTCAATCTG 
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WO 02/086443 

GGCAAGAATA GCCTCACCCA 
GTCCTCCGGC TGTATGAGAA 
GTTAACCTGC AGGAACTGGC 
TTCCACAACA ACCACAACCT 
CCACCCAGCA TCTTCATGCA 
CTGAAGGAGC TCTCTCTGGG 
TATGACAACC ACATCTCTTC 
GTCCTGATTC TTAGCCGCAA 
ACGGAGCTTC GGGAGCTGTC 
TTCCGCATGT TGGCCAACCT 
CCAGGGAATA TCTTCGCCAA 
CTGGAGAACT TGCCCCTCGG 
TATGACAATC CCTGGAGGTG 
AACCAGCCTA GGTTAGGGAC 
GGCCAGTCCC TCATTATCAT 
GTGCCTAGTT ACCCAGAAAC 
TCCGTCTCTT CTACCACTGA 
ATTCAGGTCA CTGATGACCG 
ATTGCCGCCA TTGTAATTGG 
TGTTGCTGCT GCAAGAAGAG 
TGTTAAAGAG GCAGGCTGGA 
TCATCTTTCT GCCTCCACCC 
CTAGATAAAG GTGTGCCTAC 
CGTGCCGGAC CTTCCTACAA 
GGATTTCCGA TTCATACCCC 
ACCTGTCCTC CAAGAACAGC 
AGTTAGT CC A CAGCCTGCTC 
CCTAAGTATT ATGTAAGTTG 
ACCCAGCATG TCCCCTCAAA 
TGAGTTCTCT CCTCAAAGAA 
CAGCCTGGTT TTGGGGATGC 
AGACAGAAGA GCCGTCATCA 
CCCCAGCACA GCAAGCTCAG 
TGAAAAGTTT AGCCCTTTAA 
AAAAT CAGCT TATTAATACG 
CACCCCTAGA GTTTGTTTTA 
GTGGGAACAT GATAGTGTAT 
CAG CAT CT AG ACCCAGACCC 
GGAGATGGGG GCTTCTGAAG 
TCCCCCCACA GTCAGCCTGT 
TGTGGACAGG ATGGGAGACT 
AGAGACCCTG AGACCTGGGG 
GTCCGTGCAG CCACACCCTC 
TCCGCCTGGA GCCTTCTATG 
ACTTAGGGGA AGTGAAAT CG 
GAATCTAGTG TCTTTCTAAT 
TGAACTTCAG AATCTCACTT 
GTCTGGGGGC TCCCTGGAGC 
TCCAGGGTTA TTCTCCTCCT 
CTGCTATACA CATATTCACA 
CTCTGGACAA CTGGCCCAGT 
AGGAAAGAAC TTCAGCTGAC 
TCTTATTAGC TCCCCGCTCC 
TCGGCTCTTA TTAGCTCCCC 
CCCGATCGGC TCTTATTAGC 
CAGGAGCACG TGCTGACCAG 
TGTTTGCAAA CACTAGTGCA 
AGATGAGGCC CGTCAGAGTC 
ACTATTGGTG GCACCTGGAG 
CCAGAGCATG GCACATGAGC 
GGGGCATCCC GGCCCGTACC 
GGTGCTCCTG TGAGTGGCCT 
GAGGGAGGTG GGAAACCTCA 
GGTATTCCTG GCAGTAGCCA 
GAGGGCCACT GTCCTCAGAT 
CCTTATGTGA ACCTCTTGCC 
GCCTCCTTTT CTTCAGCGGG 
TACTAGAAAA GCTGAGTGGA 
GGGCTGGAAT GAGCCGGCTG 
CCTCTCTGTT TACAGCTCCT 
GTGTTGGAGA AGAAACAACA 
TGCACAGATA CTCTTCAAGC 
GGTAGGAGTG CCGCCTCTAC 
GGTGTTCAAT AGGCTGGGAG 
TTGTCTTGGG CTTTCGTCAT 
TTAGTCTTGG TCATCAGAAC 
GGAAAAAATA AACTCTTCCA 
TGGGCTGTAT GTATATTGTT 
AACTTTTCAT GGACACAATT 
GAACTTCCAA ACTCAGGAAG 
AGTTGGTCGA CAGATGTTAG 
GCCCCCAGAT CCCACAGTCA 
GGAAGGAAGC CATGGCTGTG 
CTCCTTCCGC CCCAGGTTTC 
CTTCATGCTG CCTTCAAAGC 
GCCCCAGTGC TTGGCGATGC 
AGCCCTGGTG GGCAGGGTTG 



PCT/US02/12476 



CATCTCACCC 
CAGGCTCACG 
TCTACAGCAG 
CCAGAGACTC 
GCTGCCCCAG 
GATCTTCGGG 
TCTACCCGAC 
TCAGATCAGC 
CCTCCACACC 
GCAGAACATC 
CGT CAATGGC 
CATCTTCGAT 
TGACTCAGAC 
GGACACTGTA 
CAATGT CAAC 
ACCATGGTAC 
GCTAACCAGC 
CAGCGTTTGG 
CATTGTCGCC 
GAGCCAAGCT 
GCAGGGCTGG 
CTGGGTCCAT 
CTCTTCCTGA 
TCAGGAAGAT 
TGGGCTTCCT 
CTTCCCTGCG 
ACTTCGTGGG 
ATTTCCCTTC 
TGAAAGTTCT 
GACTTCAAAC 
TATGAAAGAG 
GTGTCTCACT 
CCTTTTAGAG 
GGAATGAAAT 
GGATAGAGAA 
AAATTTTTAA 
GGCTTGGTGG 
AGAGCATCAC 
ATGGACTTAC 
GCAAAGGCCC 
GTGGCCTGAA 
CACCATGGCT 
TTCCCTGCCA 
GACGTGATAT 
CTCAGAGATG 
GTGGTAAAAT 
ACAGCAGGCG 
TCCTCCTGCG 
CGAGTCACAG 
TGGCGCTCAA 
TTACAGTGAA 
TCCACGGGGA 
ACAAGACACC 
GCTCCACAAG 
TCCCCGCTCC 
TTTTCCCTTC 
CTTTGTAGCT 
AAGAGATGTC 
GACATGCACC 
ATCACCCGCT 
CCTCCAGACA 
CCAGATGTCT 
TCATCCGGTG 
TGACATTGGA 
GACACCACCC 
TCTTCCTTTC 
CCCTTCAACC 
GTCTCCTTTC 
GTCCCCCAGA 
TGACAGTCCC 
AAAGCCAATT 
ACTGGACGTG 
CCACTTGTGA 
TTTTATTTAT 
TAAACCAAAG 
CTCACTTGGT 
TCCCTTAAAG 
CTTCCTCCTT 
TCCACAACCT 
TTTGCAGAGA 
ATGT AT CCT A 
GAACTGAATC 
GTTCAGAGAG 
TTCTTCTCTT 
T AGAT C ATGT 
ATTTACAGAT 
GGGGGTCTGT 



AGGGTCTTCC 
GATATCCCCA 
AACCAGATTG 
TACCTGTCCA 
CTCAACCGTC 
CCCATGCCCA 
AATGTCTTCA 
TTCATCTCCC 
AACGCACTGC 
TCCCTGCAGA 
CTCATGGCCA 
CACCTGGGGA 
ATCCTTCCGC 
CCTGTGTGTT 
GTTGCTGTTC 
CCAGACACAC 
CCTGTGGAAG 
GGCATGACCC 
CTGGCCTGCT 
GTCCTGATGC 
GGAATGATGG 
GGAGCTTTCC 
CTTGCCTGAT 
AGATCCAACT 
TCGAGAGGGC 
CCCAGGCCCC 
AATAGTTCTC 
TTTTGTTTCT 
CCCCTTGATT 
CATTTAACTG 
AGAAGGAAAA 
TGTGATTTTT 
AAGGATATTT 
CATGTAGAAT 
AGAAATCTGG 
TTGAAGCATG 
ATTTTCACAA 
AAATATCCCC 
CTGGGACCTG 
CGTGGCCAGG 
CAGGAGATTT 
GGCCAGGTCA 
GCAAGTTGTC 
GCCTGTATCT 
AGATCCTTTA 
TCTCCATCAA 
ACACGGGGGT 
TGTGGTCTGG 
TCACACGAAT 
GAAGTTAGGC 
ATGGAGAATT 
TCTGGAAATC 
TGTGCTTTGG 
ACACCTGTGA 
ACAAGACACC 
CAGTTCCTGC 
TTTCACCCTC 
ATCCCCCCAG 
AAGGCTTGCC 
GATGGTGGCC 
GGAAGCATGG 
TTGTGCATAG 
GGCCCTGCCA 
GCACCTTCCT 
AGGAGCACCC 
TCCCATCAGA 
TCTCTGCACC 
CAACAGGATG 
AAGCTGGAGT 
ACGCCCATCT 
AGAACCACTA 
GATTCTCTCT 
TGGGGTACAG 
CTCTTCAAAC 
GAAATGGAAG 
ACCATATAGA 
AATAGAATAG 
AGAATTTAGA 
TTCAGATGCT 
GCAGACAGCT 
GCTTTTAGCC 
TGCGTTGTTG 
GGTGGGCTGG 
AAGGAGAGAT 
TTGCCTTGCT 
TTCTAGGCCC 
CTTCTGCTGG 



AGCACCTGGG 
TGGGCACTTT 
GACTGCTCTC 
ACAACCACAT 
TTACTCTCTT 
ACCTGCGGGA 
GCAACCTCCG 
CGGGTGCCTT 
AGGACCTGGA 
ACAAT CGCCT 
TCCAGCTGCA 
AACTGTGTGA 
TCCGCAACTG 
TCAGCCCAGC 
CAAGCGTCCA 
CCAGTTACCC 
ACTACACTGA 
AGGCCCAGAG 
CCCTGGCTGC 
AGATGAAGGC 
GACTGGAGGA 
CGTGATTGCT 
TCTCCCGTAG 
GGCCATGGCA 
TCTTCCTCCA 
CTCCGGGCCT 
CGCTGAGATA 
CTTGTTTGTG 
TTCTGCTCCT 
GTTTCTTAAG 
TCATGCCGCT 
ATCTGGAAAA 
CCAAACTGCA 
TTTGGACTTC 
TGCCTGGGGG 
TGAAGTGTAC 
ACTGAACATA 
CATCCTGGGC 
CCCCCCATGA 
GGTGGAGGAG 
TATTATATCT 
GAAGCATCCT 
TGCGGCTCAT 
GTTTTTAATT 
ATTGAAAACG 
CATCACAGTC 
ACACCGATGG 
TTAGGAGTTG 
ACCTGCCTTC 
TCATGGCAAC 
TCAGGTCTCC 
CACGACCAAT 
AAATCCACCA 
TCTGGAAATC 
TGTGACATCC 
ACAAAAAGTG 
TGTCCCAGGG 
GGTCTCCAAG 
AGAGCCAACA 
TGCTGTGCCT 
GTTTGCCCAC 
GCACAAGTGG 
ATCTTAACCC 
CTCCAGCCAG 
TAGGTGAGGG 
GTGGTTGGAT 
ATGTTGTCTG 
ATGCATTTGC 
GGGGTACAGA 
GGAGTGGGAG 
TTTTTAAAAA 
CTAGCCCTCA 
AGGCACTTGC 
TTTGTACAAG 
CCATTCCCCT 
TCAAAAGCTT 
TTTGTCCCTC 
GATACAAGAG 
GATGTAGAGC 
AGAGATAACT 
ATAAACCACT 
GGAAGCCAGC 
CAAGCCACTT 
TGTTCTCACC 
TAGAGAATTA 
TCAGGGTTTT 
ATGCTGCTTG 



CAATCTCCAG 600 

TGATGGGCTT 660 

CCCTGGTCTC 72 0 

CTCCCAGCTG 780 

TGGGAATTCC 840 

GCTTTGGCTC 900 

CCAGTTGCAG 960 

CAACGGGCTA 102 0 

CGGGAATGTC 1080 

CAGACAGCTC 1140 

GAACAACCAG 120 0 

GCTGCGG CTG 12 60 

GCTCCTGCTC 1320 

CAATGTCCGA 13 80 

TGTCCCTGAG 1440 

TGACACCACA 1500 

TCTGACTACC 1560 

CGGGCTGGCC 162 0 

CTGCGTCGGC 1680 

ACCCAATGAG 1740 

CCTGGGAATT 180 0 

CTTTCTGGCC 1860 

AGAAG CAGGT 192 0 

AAAGCCCTGG 1980 

AATCCTCCCC 2 040 

CTGTAGACTC 210 0 

GCCCCTCTCG 2160 

CTATGGCTTG 2220 

GAAGGCAGGG 2280 

AGCCGT CAAT 2 340 

CAGTTCCTGG 240 0 

GGAAGAAACA 2460 

AACTTTGCTT 2 520 

TAAAAACATT 2580 

TCCCTGTGTT 2 640 

STGCAGAAAA 2 700 

CCTGTGTAAT 2760 

TTTTCCCAGA 2 82 0 

GCCAGGACGG 2880 

AATATGTGGG 2 940 

GGAGACCCTG 3 000 

GACTGCAGAG 3 060 

CGGAGGCCCC 312 0 

TTCATTCTTC 3180 

AAGTGTAACG 3 240 

AGCTGGCAGC 33 00 

GTCACACTGG 3360 

AGTTGTTTGC 3420 

TCTGGCTTTC 3480 

GTGTGTCTTT 3540 

ACGTCTGCCC 3 600 

CCCGATCGGC 3 660 

CCAATCCCGA 3 720 

TACCACCAAT 3 7 80 

TCCAGGGCCA 3 840 

T CC AGAGGGC 3900 

AAT CTAGGAG 3 960 

GCATTTCCAC 4020 

GGAAGTGAGC 4 0 80 

GGTGCCAACA 4140 

AGACCTGTCG 42 00 

GCCAGGGCTG 42 60 

AGAACCCTTA 4320 

AGGCTGACCT 43 80 

GTGAGGGCCC 4440 

GGAGCCATTG 4500 

GCTGAGGAGC 4560 

TCAATTCTCA 462 0 

GTTCAGTTTT 4680 

CTGGGAGTTA 4740 

GTGCTTACTG 4800 

GCACCCCTGC 4 860 

TCTTCTGCAT 492 0 

AGCTCATGGC 4980 

GTTGCTCTCC 5040 

TGTAACCACA 5100 

TCATGGGAAT 5160 

TTCTACTTAG 522 0 

TATTGGGAAA 52 80 

CGGGACCCAG 5340 

CAAAGATTCA 5400 

AGTGGCCTTG 5460 

CCGGGGAAAA 552 0 

AACCCGCTGC 5580 

CTGCAAATCA 5640 

GTAGAGTGTG 5700 

TAATCCATTT 5760 



422 



WO 02/086443 

GGTGTACAGA ATCAACAATA AATAATATAC ATGTAT 
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Seq ID NO: 611 Protein sequence 
Protein Accession #: BAB84587.1 

1 11 21 31 41 51 

I I I I I 1 

MPLKHYLLLL VGCQAWGAGL AYHGCPSECT CSRASQVECT GARIVAVPTP LPWNAMSLQI 60 

LNTHITELNE SPFLNISALI ALRIEKNELS RITPGAFRNL GSLRYLSLAN NKLQVLPIGL 120 

10 FQGLDSLESL LLSSNQLLQI QPAHFSQCSN LKELQLHGNH LEYIPDGAFD HLVGLTKLNL 180 

GKNSLTHISP RVFQHLGNLQ VLRLYENRLT DIPMGTFDGL VNLQELALQQ NQIGLLSPGL 240 

FHNNHNLQRL YLSNNHISQL PPSIFMQLPQ LNRLTLFGNS LKELSLGIFG PMPNLRELWL 300 

YDNHISSLPD NVFSNLRQLQ VLILSRNQIS FISPGAFNGL TELRELSLHT NALQDLDGNV 360 

FRMLANLQNI SLQNNRLRQL PGNIFANVNG LMAIQLQNNQ LENLPLGIFD HLGKLCELRL 420 

15 YDNPWRCDSD ILPLRNWLLL NQPRLGTDTV PVCFSPANVR GQSLIIINVN VAVPSVHVPE 480 

VPSYPETPWY PDTPSYPDTT SVSSTTELTS PVEDYTDLTT IQVTDDRSVW GMTQAQSGLA 540 
IAAIVIGIVA LACSLAACVG CCCCKKRSQA VLMQMKAPNE C 

Seq ID NO: 612 DNA sequence 
20 Nucleic Acid Accession #: XM_098151 
Coding sequence: 1..447 

1 11 21 31 41 51 

04 - I 1 I ! I I 

ZD ATGATGCATT TGCTCAATTC TCAGGGCTGG AATGAGCCGG CTGGTCCCCC AGAAAGCTGG 60 

AGTGGGGTAC AGAGTT CAGT TTTCCTCTCT GTTTACAGCT CCTTGACAGT CCCACGCCCA 120 

TCTGGAGTGG GAGCTGGGAG TCAGTGTTGG AGAAGAAACA ACAAAAGCCA ATTAGAACCA 180 

CTATTTTTAA AAAGTGCTTA CTGTGCACAG ATACTCTTCA AGCACTGGAC GTGGATTCTC 240 

TCTCTAGCCC TCAGCACCCC TGCGGTAGGA GTGCCGCCTC TACCCACTTG TGATGGG GT A 300 

30 CAGAGGCACT TGCTCTTCTG CATGGTGTTC AATAGGCTGG GAGTTTTATT TATCTCTTCA 360 

AACTTTGTAC AAGAGCTCAT GGCTTGTCTT GGGCTTTCGT CATTAAACCA AAGGAAATGG 42 0 
AAGCCATTCC CCTGTTGCTC TCCTTAG 

Seq ID NO: 613 Protein sequence 
35 Protein Accession #: XP_098151 

1 11 21 31 41 51 

I I I I I I 

MMHLLNSQGW NEPAGPPESW SGVQSSVFLS VYSSLTVPRP SGVGAGSQCW RRNNKSQLEP 60 

40 LFLKSAYCAQ ILFKHWTWIL SLALSTPAVG VPPLPTCDGV QRHLLFCMVF NRLGVLFISS 120 
NFVQELMACL GLSSLNQRKW KPFPCCSP 

Seq ID NO: 614 DNA sequence 
Nucleic Acid Accession #: NM_002658.1 
45 Coding sequence: 77.. 1372 

1 11 21 31 41 51 

I I I I I I 

GTCCCCGCAG CGCCGTCGCG CCCTCCTGCC GCAGGCCACC GAGGCCGCCG CCGTCTAGCG 60 

50 CCCCGACCTC GCCACCATGA GAGCCCTGCT GGCGCGCCTG CTTCTCTGCG TCCTGGTCGT 120 

GAGCGACTCC AAAGGCAG CA ATGAACTTCA TCAAGTTCCA TCGAACTGTG ACTGTCTAAA 180 

TGGAGGAACA TGTGTGTCCA ACAAGTACTT CTCCAACATT CACTGGTGCA ACTGCCCAAA 240 

GAAATTCGGA GGGCAGCACT GTGAAATAGA TAAGTCAAAA ACCTGCTATG AGGGGAATGG 300 

TCACTTTTAC CGAGGAAAGG CCAGCACTGA CACCATGGGC CGGCCCTGCC TGCCCTGGAA 3 60 

55 CTCTGCCACT GTCCTTCAGC AAACGTACCA TGCCCACAGA TCTGATGCTC TTCAGCTGGG 42 0 

CCTGGGGAAA CATAATTACT GCAGGAACCC AGACAACCGG AGGCGACCCT GGTGCTATGT 480 

GCAGGTGGGC CTAAAGCCGC TTGTCCAAGA GTGCATGGTG CATGACTGCG CAGATGGAAA 540 

AAAGCCCTCC TCTCCTCCAG AAGAATTAAA ATTTCAGTGT GGCCAAAAGA CTCTGAGGCC 600 

CCGCTTTAAG ATTATTGGGG GAGAATTCAC CACCATCGAG AACCAGCCCT GGTTTGCGGC 660 

60 CATCTACAGG AGGCACCGGG GGGGCTCTGT CACCTACGTG TGTGGAGGCA GCCTCATCAG 72 0 

CCCTTGCTGG GTGATCAGCG CCACACACTG CTTCATTGAT TACCCAAAGA AGGAGGACTA 780 

CATCGTCTAC CTGGGTCGCT CAAGGCTTAA CTCCAACACG CAAGGGGAGA TGAAGTTTGA 840 

GGTGGAAAAC CTCATCCTAC ACAAGGACTA CAGCGCTGAC ACGCTTGCTC AC CACAACGA 90 0 

CATTGCCTTG CTGAAGATCC GTT CCAAGGA GGGCAGGTGT GCGCAGCCAT CCCGGACTAT 960 

65 ACAGACCATC TGCCTGCCCT CGATGTATAA CGATCCCCAG TTTGGCACAA GCTGTGAGAT 102 0 

CACTGGCTTT GGAAAAGAGA ATTCTACCGA CTATCTCTAT CCGGAGCAGC TGAAAATGAC 1080 

TGTTGTGAAG CTGATTTCCC ACCGGGAGTG TCAGCAGCCC CACTACTACG GCTCTGAAGT 1140 

CACCACCAAA ATGCTATGTG CTGCTGACCC CCAATGGAAA ACAGATTCCT GCCAGGGAGA 12 00 

CTCAGGGGGA CCCCTCGTCT GTTCCCTCCA AGGCCGCATG ACTTTGACTG GAATTGTGAG 1260 

70 CTGGGGCCGT GGATGTGCCC TGAAGGACAA GCCAGGCGTC TACACGAGAG TCT CACACTT 1320 

CTTACCCTGG ATCCGCAGTC ACACCAAGGA AGAGAATGGC CTGGCCCTCT GAGGGTCCCC 13 80 

AGGGAGGAAA CGGGCACCAC CCGCTTTCTT GCTGGTTGTC ATTTTTGCAG TAGAGTCATC 1440 

TCCATCAGCT GTAAGAAGAG ACTGGGAAGA TAGGCTCTGC ACAGATGGAT TTGCCTGTGG 1500 

CACCACCAGG GTGAACGACA ATAGCTTTAC CCTCACGGAT AGGCCTGGGT GCTGGCTGCC 1560 

75 CAGACCCTCT GGCCAGGATG GAGGGGTGGT CCTGACTCAA CATGTTACTG ACCAGCAACT 1620 

TGTCTTTTTC TGGACTGAAG CCTGCAGGAG TTAAAAAGGG CAGGGCATCT CCTGTGCATG 1680 

GGCTCGAAGG GAGAGCCAGC TCCCCCGACC GGTGGGCATT TGTGAGGCCC ATGGTTGAGA 1740 

AATGAATAAT TTCCCAATTA GGAAGTGTAA GCAGCTGAGG TCTCTTGAGG GAGCTTAGCC 1800 

AATGTGGGAG CAGCGGTTTG GGGAGCAGAG ACACTAACGA CTTCAGGGCA GGGCTCTGAT 1860 

80 AT T CCATGAA TGTATCAGGA AATATATATG TGTGTGTATG TTTGCACACT TGTTGTGTGG 192 0 

GCTGTGAGTG TAAGTGTGAG TAAGAGCTGG TGTCTGATTG TTAAGT CTAA ATATTTCCTT 1980 

AAACTGTGTG GACTGTGATG CCACACAGAG TGGTCTTTCT GGAGAGGTTA TAGGTCACTC 2 04 0 

CTGGGGCCTC TTGGGTCCCC CACGTGACAG TGCCTGGGAA TGTACTTATT CTGCAGCATG 210 0 

ACCTGTGACC AGCACTGTCT CAGTTTCACT TT CACATAGA TGTCCCTTTC TTGGCCAGTT 2160 

85 ATCCCTTCCT TTTAGCCTAG TTCATCCAAT CCTCACTGGG TGGGGTGAGG ACCACTCCTT 2220 

ACACTGAATA TTTATATTTC ACTATTTTTA TTTATATTTT TGTAATTTTA AATAAAAGTG 22 80 
ATCAATAAAA TGTGATTTTT CTGA 
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Seq ID NO: 615 Protein sequence 
Protein Accession #: NP_002649.1 

5 1 11 21 31 41 51 

I 1 1 I I 1 

MRALLARLLL CVLVVSDSKG SNELHQVPSN CDCLNGGTCV SNKYFSNIHW CNCPKKFGGQ 60 

HCEIDKSKTC YEGNGHFYRG KASTDTMGRP CLPWNSATVL QQTYHAHRSD ALQLGLGKHN 120 

YCRNPDNRRR PWCYVQVGLK PLVQECMVHD CADGKKPSSP PEELKFQCGQ KTLRPRFKII 180 

10 GGEFTTIENQ PWFAAIYRRH RGGSVTYVCG GSLISPCWVI SATHCFIDYP KKEDYIVYLG 240 

RSRLNSNTQG EMKFEVENLI LHKDYSADTL AHHNDIALLK IRSKEGRCAQ PSRTIQTICL 300 

PSMYNDPQFG TSCEITGFGK ENSTDYLYPE QLKMTVVKLI SHRECQQPHY YGSEVTTKML 360 

CAADPQWKTD SCQGDSGGPL VCSLQGRMTL TGIVSWGRGC ALKDKPGVYT RVSHFLPWIR 420 
SHTKEENGLA L 

15 

Seq ID NO: 616 DNA sequence 

Nucleic Acid Accession #: NM_024422.1 

Coding sequence: 202.. 2907 

20 1 11 21 31 41 51 

I 1 1 ! I 1 

CGCCAAAGGA AAAGCCCCTT GGATGAGAGG CAGGCGCTTC AGAGAAGCTA AGAAAAGCAC 60 

CTCTCCGCGC GCCCCACCTC CTCCGCCTCG CGCTCCTCCT GAGCAGCGGG CCCAGACTGC 12 0 

GCTCCGGCCG CGGCCCTCGC CCCGCGGAGC CCTCCTACCC CGGCCCGACG CTCGGCCCGC 180 

25 GACCTGCCCC GAGCCCTCTC CATGGAGGCA GCCCGCCCCT CCGGCTCCTG GAACGGAGCC 240 

CTCTGCCGGC TGCTCCTGCT GACCCTCGCG AT CTTAATAT TTG CCAGTG A TGCCTGCAAA 300 

AATGTGACAT TACATGTTCC CTCCAAACTA GATGCCGAGA AACTTGTTGG TAGAGTTAAC 3 60 

CTGAAAGAGT GCTTTACAGC TGCAAATCTA ATTCATTCAA GTGATCCTGA CTTCCAAATT 420 

TTGGAGGATG GTTCAGTCTA TACAACAAAT ACTATTCTAT TGTCCTCGGA GAAGAGAAGT 480 

30 TTTACCATAT TACTTTCCAA CACTGAGAAC CAAGAAAAGA AGAAAATATT TGTCTTTTTG 540 

GAGCATCAAA CAAAGGTCCT AAAGAAAAGA CATACTAAAG AAAAAGTTCT AAGGCGCGCC 600 

AAGAGAAGAT GGGCTCCAAT TCCTTGTTCG ATGCTAGAAA ACTCCTTGGG TCCTTTTCCA 660 

CTTTTCCTTC AACAGGTTCA ATCTGACACG GCCCAAAACT ATACCATATA CTATTCCATA 72 0 

AGAGGTCCTG GAGTTGACCA AGAACCTCGG AATTTATTTT ATGTGGAGAG AGACACTGGA 780 

35 AACTTGTATT GTACT CGTCC TGTAGATCGT GAGCAGTATG AATCTTTTGA GATAATTGCC 840 

TTTGCAACAA CTCCAGATGG GTATACTCCA GAACTTCCAC TGCCCCTAAT AATCAAAATA 900 

GAGGATGAAA ATGATAACTA CCCAATTTTT ACAGAAGAAA CTTATACTTT TACAATTTTT 960 

GAAAATTGCA GAGTGGGCAC TACTGTGGGA CAAGTGTGTG CTACTGACAA AGATGAGCCT 102 0 

GACACGATGC ACACACGCCT GAAGTACTCC ATCATTGGGC AGGTGCCACC ATCACCCACC 1080 

40 CTATTTTCTA TGCATCCAAC TACAGGCGTG ATCACCACAA CATCATCTCA GCTAGACAGA 1140 

GAGTTAATTG ACAAGTACCA GTTGAAAATA AAAGTACAAG ACATGGATGG TCAGTATTTT 1200 

GGTCTACAGA CAACTTCAAC TTGTATCATT AACATTGATG ATGTAAATGA CCACTTGCCA 1260 

ACAT TT ACT C GTACTTCTTA TGTGACATCA GTGGAAGAAA ATACAGTTGA TGTGGAAATC 1320 

TTACGAGTTA CTGTTGAGGA TAAGGACTTA GTGAATACTG CTAACTGGAG AGCTAATTAT 1380 

45 ACCATTTTAA AGGGCAATGA AAATGGCAAT TTTAAAATTG TAACAGATGC CAAAACCAAT 1440 

GAAGGAGTTC TTTGTGTAGT TAAGCCTTTG AATTATGAAG AAAAGCAACA GATGAT CTTG 1500 

CAAATTGGTG TAGTTAATGA AGCTCCATTT TCCAGAGAGG CTAGTCCAAG ATCAGCCATG 1560 

AGCACAGCAA CAGTTACTGT TAATGTAGAA GAT CAGGATG AGGGCCCTGA GTGTAACCCT 162 0 

CCAATACAGA CTGTTCGCAT GAAAGAAAAT GCAGAAGTGG GAACAACAAG CAATGGATAT 1680 

50 AAAG CAT ATG ACCCAGAAAC AAGAAGTAGC AGTGGCATAA GGTATAAGAA ATTAACTGAT 1740 

CCAACAGGGT GGGTCACCAT TGATGAAAAT ACAGGATCAA TCAAAGTTTT CAGAAGCCTG 1800 

GATAGAGAGG CAGAGACCAT CAAAAATGGC ATATATAATA TTACAGTCCT TGCATCAGAC 1860 

CAAGGAGGGA GAACATGTAC GGGGACACTG GGCATTATAC TTCAAGACGT GAATGATAAC 192 0 

AGCCCATTCA TACCTAAAAA GACAGTGATC ATCTGCAAAC CCACCATGTC ATCTGCGGAG 1980 

55 ATTGTTGCGG TTGATCCTGA TGAGCCTATC CATGGCCCAC CCTTTGACTT TAGTCTGGAG 2040 

AGTTCTACTT CAGAAGTACA GAGAATGTGG AGACTGAAAG CAATTAATGA TACAGCAGCA 210 0 

CGTCTTTCCT ATCAGAATGA TCCTCCATTT GGCTCATATG TAGTACCTAT AACAGTGAGA 2160 

GATAGACTTG GCATGTCTAG TGTCACTTCA TTGGATGTTA CACTGTGTGA CTGCATTACC 2220 

GAAAATGACT GCACACATCG TGTAGATCCA AGGATTGGCG GTGGAGGAGT ACAACTTGGA 22 80 

60 AAGTGGGCCA TCCTTGCAAT ATTGTTGGGC ATAGCATTGC TCTTTTGCAT CCTGTTTACG 2 340 

CTGGTCTGTG GGGCTTCTGG GACGTCTAAA CAACCAAAAG TAATTCCTGA TGATTTAGCC 2400 

CAGCAGAACC TAATTGTATC AAACACAGAA GCTCCTGGAG ATGACAAAGT GTATTCTGCG 246 0 

AATGGCTTCA CAACCCAAAC TGTGGGCGCT TCTGCTCAGG GAGTTTGTGG CACCGTGGGA 2 520 

TCAGGAATCA AAAACGGAGG TCAGGAGACC ATCGAAATGG TGAAAGGAGG ACACCAGACC 2580 

65 TCGGAATCCT GCCGGGGGGC TGG CCACCAT CACACCCTGG ACTCCTGCAG GGGAGGACAC 2 640 

ACGGAGGTGG ACAACTGCAG ATACACTTAC TCGGAGTGGC ACAGTTTTAC TCAGCCCCGT 2 70 0 

CTTGGTGAAA AAGTGTATCT GTGTAATCAA GATGAAAATC ACAAGCATGC CCAAGACTAT 2760 

GTCCTGACAT ATAACTATGA AGGAAGAGGA TCGGTGGCTG GGT CTGTAGG TTGTTGCAGT 282 0 

GAACGACAAG AAGAAGATGG GCTTGAATTT TTGGATAATT TGGAGCCCAA ATTTAGGACA 2 8 80 

70 CTAGCAGAAG CATGCATGAA GAGATGAGTG TGTTCTAATA AGTCT CTGAA AGCCAGTGGC 2 940 

TTTATGACTT TTAAAAAAAA TTACAAACCA AGAATTTTTT AAAGCAGAAG ATGCTATTTG 3 000 

TGGGGGTTTT TCTCTCATTA TTTGGATGGA ATCTCTTTGG TCAAATGCAC ATTTACAGAG 3 060 

AGACACTATA AACAAGTACA CAAATTTTTC AATTTTTACA TATTTTTAAA TTACTTATCT 3120 

TCT AT CCAAG GAGGTCTACA GAGAAATTAA AGTCTGCCTT ATTTGTTACA TTTGGGTATA 3180 

75 ATGACAACAG CCAATTTATA GTGCAATAAA ATGTAATTAA TTCAAGTCCT TATTATAGAC 3240 

TATTTGAAGC ACAACCTAAT GGAAAATTGT AGAGACCTTG CTTTAACATT ATCTCCAGTT 33 00 

AATTAAGTGT TCATGTGGTG CTTGGAAACT GTTGTTTTCC TGAACATCTA AAGTGTGTAG 3 3 60 

ACTGCATTCT TGCTATTATT TTATTCTTGT AATGTGACCT TTTCACTGTG CAAAGGGAGA 342 0 
TTTCTAGCCA GGCATTGACT ATTACAATTT CATT 

80 

Seq ID NO: 617 Protein sequence 
Protein Accession #: NP_077740.1 

1 11 21 31 41 51 

85 | | | 1 I I 

MEAARPSGSW NGALCRLLLL TLAILIFASD ACKNVTLHVP SKLDAEKLVG RVNLKECFTA 60 

ANLIHSSDPD FQILEDGSVY TTNTILLSSE KRSFTILLSN TENQEKKKIF VFLEHQTKVL 12 0 
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KKRHTKEKVL RRAKRRWAPI 
EPRNLFYVER DTGNLYCTRP 
PIFTEETYTF T I FENCRVGT 
TGVITTTSSQ DDRELIDKYQ 
VTSVEENTVD VEI LRVTVED 
KPLNYEEKQQ MILQIGVVNE 
KENAEVGTTS NGYKAYDPET 
KNGIYNITVL ASDQGGRTCT 
EPIHGPPFDF SLESSTSEVQ 
VTSLDVTLCD CITENDCTHR 
TSKQPKVIPD DLAQQNLIVS 
QETIEMVKGG HQTSESCRGA 
CNQDENHKHA QDYVLTYNYE 
R 
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PCSMLENSLG 
VDREQYESFE 
TVGQVCATDK 
LKIKVQDMDG 
KDLVNTANWR 
APFSREASPR 
RSSSGIRYKK 
GTLGI ILQDV 
RMWRLKAIND 
VDPRIGGGGV 
NTEAPGDDKV 
GHHHTLDSCR 
GRGSVAGSVG 



PFPLFLQQVQ 
I I AFATTPDG 
DEPDTMHTRL 
QYFGLQTTST 
ANYTILKGNE 
SAMSTATVTV 
LTDPTGWVTI 
NDNSPFIPKK 
TAARLSYQND 
QLGKWAILAI 
YSANGFTTQT 
GGHTEVDNCR 
CCSERQEEDG 



SDTAQNYTIY 
YTPELPLPLI 
KYSIIGQVPP 
CI INIDDVND 
NGNFKIVTDA 
NVEDQDEGPE 
DENTGSIKVF 
TVIICKPTMS 
PPFGSYVVPI 
LLGIALLFCI 
VGASAQGVCG 
YTYSEWHSFT 
LEFLDNLEPK 



YSIRGPGVDQ 
IKIEDENDNY 
SPTLFSMHPT 
HLPTFTRTSY 
KTNEGVLCVV 
CNPPIQTVRM 
RSLDREAETI 
SAEIVAVDPD 
TVRDRLGMSS 
LFTLVCGASG 
TVGSGIKNGG 
QPRLGEKVYL 
FRTLAEACMK 



Seq ID NO: 618 DNA sequence 

Nucleic Acid Accession #: NM_004949.1 

Coding sequence: 202.. 2745 



80 



CG CCAAAGG A 
CTCTCCGCGC 
GCTCCGGCCG 
GACCTGCCCC 
CTCTGCCGGC 
AATGTGACAT 
CTGAAAGAGT 
TTGGAGGATG 
TTTACCATAT 
GAGCATCAAA 
AAGAGAAGAT 
CTTTTCCTTC 
AGAGGTCCTG 
AACTTGTATT 
TTTGCAACAA 
GAGGATGAAA 
GAAAATTGCA 
GACACGATGC 
CTATTTTCTA 
GAGTTAATTG 
GGT CTACAGA 
ACATTTACTC 
TTACGAGTTA 
ACCATTTTAA 
GAAGGAGTTC 
CAAATTGGTG 
AGCACAGCAA 
CCAATACAGA 
AAAGCATATG 
CCAACAGGGT 
GATAGAGAGG 
CAAGGAGGGA 
AGCCCATTCA 
ATTGTTGCGG 
AGTTCTACTT 
CGTCTTTCCT 
GATAGACTTG 
* GAAAATGACT 
AAGTGGGCCA 
CTGGTCTGTG 
CAGCAGAACC 
AATGGCTTCA 
TCAGGAATCA 
TCGGAATCCT 
ACGGAGGTGG 
CTTGGTGAAG 
GTATCTGTGT 
CTATGAAGGA 
AGATGGGCTT 
CATGAAGAGA 
AAAAAATTAC 
TCATTATTTG 
AGTACACAAA 
T CT AC AG AG A 
TTTATAGTGC 
CCTAATGGAA 
GTGGTGCTTG 
ATTATTTTAT 
TTGACTATTA 



11 
I 

AAAGCCCCTT 
GCCCCACCTC 
CGGCCCTCGC 
GAGCCCTCTC 
TGCTCCTGCT 
TACATGTTCC 
GCTTTACAGC 
GTTCAGTCTA 
TACTTTCCAA 
CAAAGGT CCT 
GGGCTCCAAT 
AACAGGTTCA 
GAGTTGACCA 
GTACTCGTCC 
CTCCAGATGG 
ATGATAACTA 
GAGTGGGCAC 
ACACACGCCT 
TGCATCCAAC 
ACAAGTACCA 
CAACTTCAAC 
GTACTTCTTA 
CTGTTGAGGA 
AGGGCAATGA 
TTTGTGTAGT 
TAGTTAATGA 
CAGTTACTGT 
CTGTTCGCAT 
ACCCAGAAAC 
GGGTCACCAT 
CAGAGACCAT 
GAACATGTAC 
TACCTAAAAA 
TTGATCCTGA 
CAGAAGTACA 
ATCAGAATGA 
GCATGTCTAG 
GCACACATCG 
TCCTTGCAAT 
GGGCTTCTGG 
TAATTGTATC 
CAACCCAAAC 
AAAACGGAGG 
GCCGGGGGGC 
ACAACTG CAG 
AAT CCATTAG 
AATCAAGATG 
AG AGG AT CGG 
GAATTTTTGG 
TGAGTGTGTT 
AAACCAAGAA 
GATGGAATCT 
TTTTTCAATT 
AATTAAAGTC 
AATAAAATGT 
AATTGTAGAG 
GAAACTGTTG 
TCTTGTAATG 
CAATTT CATT 



21 
I 

GGATGAGAGG 
CTCCGCCTCG 
CCCGCGGAGC 
CATGGAGGCA 
GACCCTCGCG 
CTCCAAACTA 
TGCAAATCTA 
TACAACAAAT 
CACTGAGAAC 
AAAGAAAAGA 
TCCTTGTTCG 
ATCTGACACG 
AGAACCTCGG 
TGTAGATCGT 
GTATACTCCA 
CCCAATTTTT 
TACTGTGGGA 
GAAGTACTCC 
TACAGGCGTG 
GTTGAAAATA 
TTGTATCATT 
TGTGACATCA 
TAAGGACTTA 
AAATGGCAAT 
TAAGCCTTTG 
AGCTCCATTT 
TAATGTAGAA 
GAAAGAAAAT 
AAGAAGTAGC 
TGATGAAAAT 
CAAAAATGGC 
GGGGACACTG 
GACAGTGATC 
TGAGCCTATC 
GAGAATGTGG 
TCCTCCATTT 
TGTCACTTCA 
TGTAGATCCA 
ATTGTTGGGC 
GACGTCTAAA 
AAACACAGAA 
TGTGGGCGCT 
TCAGGAGACC 
TGGCCACCAT 
ATACACTTAC 
AGGACACACT 
AAAATCACAA 
TGGCTGGGTC 
ATAATTTGGA 
CTAATAAGTC 
TTTTTTAAAG 
CTTTGGTCAA 
TTTACATATT 
TGCCTTATTT 
AAT T AAT T CA 
ACCTTGCTTT 
TTTTCCTGAA 
TGACCTTTTC 



31 
I 

CAGGCGCTTC 
CGCTCCTCCT 
CCTCCTACCC 
GCCCGCCCCT 
ATCTTAATAT 
GATGCCGAGA 
ATTCATTCAA 
ACTATTCTAT 
CAAGAAAAGA 
CATACTAAAG 
ATGCTAGAAA 
GCCCAAAACT 
AATTTATTTT 
GAGCAGTATG 
GAACTTCCAC 
ACAGAAGAAA 
CAAGTGTGTG 
ATCATTGGGC 
ATCACCACAA 
AAAGTACAAG 
AACATTGATG 
GTGGAAGAAA 
GTGAATACTG 
TTTAAAATTG 
AATTATGAAG 
TCCAGAGAGG 
GATCAGGATG 
GCAGAAGTGG 
AGTGGCATAA 
ACAGGATCAA 
ATATATAATA 
GGCATTATAC 
ATCTGCAAAC 
CATGGCCCAC 
AGACTGAAAG 
GGCTCATATG 
TTGGATGTTA 
AGGATTGGCG 
ATAGCATTGC 
CAACCAAAAG 
GCTCCTGGAG 
TCTGCTCAGG 
ATCGAAATGG 
CACACCCTGG 
TCGGAGTGGC 
CTGATTAAAA 
GCATGCCCAA 
TGTAGGTTGT 
GCCCAAATTT 
TCTGAAAGCC 
CAGAAGATGC 
ATGCACATTT 
TTTAAATTAC 
GTTACATTTG 
AGTCCTTATT 
AACATTATCT 
CAT CT AAAGT 
ACTGTGCAAA 



41 
I 

AGAGAAGCTA 
GAGCAGCGGG 
CGGCCCGACG 
CCGGCTCCTG 
TTGCCAGTGA 
AACTTGTTGG 
GTGATCCTGA 
TGTCCTCGGA 
AGAAAATATT 
AAAAAGTTCT 
ACTCCTTGGG 
ATACCATATA 
ATGTGGAGAG 
AATCTTTTGA 
TGCCCCTAAT 
CTTATACTTT 
CTACTGACAA 
AGGTGCCACC 
CATCATCTCA 
ACATGGATGG 
ATGTAAATGA 
ATACAGTTGA 
CTAACTGGAG 
TAACAGATGC 
AAAAGCAACA 
CTAGTCCAAG 
AGGGCCCTGA 
GAACAACAAG 
GGTATAAGAA 
TCAAAGTTTT 
TTACAGTCCT 
TTCAAGACGT 
CCACCATGTC 
CCTTTGACTT 
CAATTAATGA 
TAGTACCTAT 
CACTGTGTGA 
GTGGAGGAGT 
TCTTTTGCAT 
TAATTCCTGA 
ATGACAAAGT 
GAGTTTGTGG 
TGAAAGGAGG 
ACTCCTGCAG 
ACAGTTTTAC 
ATTAAACAAT 
GACTATGTCC 
TGCAGTGAAC 
AGGACACTAG 
AGTGGCTTTA 
TATTTGTGGG 
ACAGAGAGAC 
TTATCTTCTA 
GGTATAATGA 
ATAGACTATT 
CCAGTTAATT 
GTGTAGACTG 
GGGAGATTTC 



51 

I 

AGAAAAGCAC 
CCCAGACTGC 
CTCGGCCCGC 
GAACGGAGCC 
TGCCTGCAAA 
TAGAGTTAAC 
CTTCCAAATT 
GAAGAGAAGT 
TGTCTTTTTG 
AAGGCGCGCC 
TCCTTTTCCA 
CTATTCCATA 
AGACACTGGA 
GATAATTGCC 
AATCAAAATA 
TACAATTTTT 
AGATGAGCCT 
ATCACCCACC 
GCTAGACAGA 
TCAGTATTTT 
CCACTTGCCA 
TGTGGAAATC 
AGCTAATTAT 
CAAAACCAAT 
GATGATCTTG 
ATCAGCCATG 
GTGTAACCCT 
CAATGGATAT 
ATTAACTGAT 
CAGAAGCCTG 
TGCATCAGAC 
GAATGATAAC 
ATCTGCGGAG 
TAGTCTGGAG 
TACAGCAGCA 
AACAGTGAGA 
CTGCATTACC 
ACAACTTGGA 
CCTGTTTACG 
TGATTTAGCC 
GTATTCTGCG 
CACCGTGGGA 
ACACCAGACC 
GGGAGGACAC 
TCAGCCCCGT 
GAAAGAAAGT 
TGACATATAA 
GACAAGAAGA 
CAGAAGCATG 
TGACTTTTAA 
GGTTTTTCTC 
ACTATAAACA 
TCCAAGGAGG 
CAACAGCCAA 
TGAAGCACAA 
AAGTGTTCAT 
CATTCTTGCT 
TAGCCAGGCA 



180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 



Seq ID NO: 619 Protein sequence 
Protein Accession #: NP_004940.1 



85 1 11 21 31 41 51 

I I I I I I 

MEAARPSGSW NGALCRLLLL TLAILIFASD ACKNVTLHVP SKLDAEKLVG RVNLKECFTA 



60 



425 




426 



WO 02/086443 PCT/US02/12476 

GCGTCAAAAG GAACGATGCA GGATCCTATG AATGTGAAAT ACAGAACCCA GCGAGTGCCA 720 

ACCGCAGTGA CCCAGTCACC CTGAATGTCC TCTATGGCCC AGATGTCCCC ACCATTTCCC 780 

CCTCAAAGGC CAATTACCGT CCAGGGGAAA ATCTGAACCT CTCCTGCCAC GCAGCCTCTA 840 

ACCCACCTGC ACAGTACTCT TGGTTTATCA ATGGGACGTT CCAGCAATCC ACACAAGAGC 900 

5 TCTTTATCCC CAACATCACT GTGAATAATA GCGGATCCTA TATGTGCCAA GCCCATAACT 960 

CAGCCACTGG CCTCAATAGG ACCACAGTCA CGATGATCAC AGTCTCTGGA AGTGCTCCTG 1020 

TCCTCTCAGC TGTGGCCACC GTCGGCATCA CGATTGGAGT GCTGGCCAGG GTGGCTCTGA 1080 

TATAGCAGCC CTGGTGTATT TTCGATATTT CAGGAAGACT GGCAGATTGG ACCAGACCCT 1140 

GAATTCTTCT AGCTCCTCCA ATCCCATTTT ATCCCATGGA ACCACTAAAA ACAAGGTCTG 1200 

10 CTCTGCTCCT GAAGCCCTAT ATGCTGGAGA TGGACAACTC AATGAAAATT TAAAGGGAAA 12 60 

ACCCTCAGGC CTGAGGTGTG TGCCACTCAG AGACTTCACC TAACTAGAGA CAGTCAAACT 1320 

GCAAACCATG GTGAGAAATT GACGACTTCA CACTATGGAC AGCTTTTCCC AAGATGT CAA 13 80 

AACAAGACTC CTCATCATGA TAAGGCTCTT ACCCCCTTTT AATTTGTCCT TGCTTATGCC 1440 

TGCCTCTTTC GCTTGGCAGG ATGATGCTGT CATTAGTATT TCACAAGAAG TAGCTTCAGA 1500 

15 GGGTAACTTA ACAGAGTGTC AGAT CTATCT TGTCAATCCC AACGTTTTAC ATAAAATAAG 1560 

AGATCCTTTA GTGCACCCAG TGACTGACAT TAGCAGCATC TTTAACACAG CCGTGTGTTC 162 0 

AAATGTACAG TGGTCCTTTT CAGAGTTGGA CTTCTAGACT CACCTGTTCT CACTCCCTGT 1680 

TTTAATTCAA CCCAGCCATG CAATGCCAAA TAATAGAATT GCTCCCTACC AGCTGAACAG 1740 

GGAGGAGTCT GTGCAGTTTC TGACACTTGT TGTTGAACAT GGCTAAATAC AATGGGTATC 1800 

20 GCTGAGACTA AGTTGTAGAA ATTAACAAAT GTGCTGCTTG GTTAAAATGG CTACACTCAT 18 60 

CTGACTCATT CTTTATTCTA TTTTAGTTGG TTTGTATCTT GCCTAAGGTG CGTAGTCCAA 1920 

CTCTTGGTAT TACCCTCCTA ATAGTCATAC TAGTAGTCAT ACTCCCTGGT GTAGTGTATT 1980 

CTCTAAAAGC TTTAAATGTC TGCATGCAGC CAGCCATCAA ATAGTGAATG GTCTCTCTTT 2 040 

GGCTGGAATT ACAAAACTCA G AG AAATGT G T CAT CAGG AG AAC AT CAT AA CCCATGAAGG 2100 

25 ATAAAAGCCC CAAATGGTGG TAACTGATAA TAG C ACT AAT G CTTTAAG AT TTGGTCACAC 2160 

TCTCACCTAG GTGAGCGCAT TG AG CCAGTG GTGCTAAATG CTACATACTC CAACTGAAAT 222 0 

GTTAAGGAAG AAGATAGATC CAATTAAAAA AAATTAAAAC CAATTTAAAA AAAAAAAAGA 2280 

ACACAGGAGA TTCCAGTCTA CTTGAGTTAG CATAATACAG AAGTCCCCTC TACTTTAACT 2340 

TTTACAAAAA AGTAACCTGA ACT AAT CTGA TGTTAACCAA TGTATTTATT TCTGTGGTTC 2400 

30 TGTTTCCTTG TTCCAATTTG ACAAAACCCA CTGTTCTTGT ATTGTATTGC CCAGGGGGAG 2460 

CTATCACTGT ACTTGTAGAG TGGTGCTGCT TTAATTCATA AATCACAAAT AAAAGCCAAT 2520 

TAGCTCTATA ACT 

Seq ID NO: 625 Protein sequence 
35 Protein Accession #: AAA59907.1 

1 11 21 31 41 51 

l l l l I l 

MGPPSAPPCR LHVPWKEVLL TASLLTFWNP PTTAKLTIES TPFNVAEGKE VLLLAHNLPQ 60 

40 NRIGYSWYKG ERVDGNSLIV GYVIGTQQAT PGPAYSGRET IYPNASLLIQ NVTQNDTGFY 120 

TLQVIKSDLV NEEATGQFHV YPELPKPSIS SNNSNPVEDK DAVAFTCEPE VQNTTYLWWV 180 

NGQSLPVSPR LQLSNGNMTL TLLSVKRNDA GSYECEIQNP ASANRSDPVT LNVLYGPDVP 240 

TISPSKANYR PGENLNLSCH AASNPPAQYS WFINGTFQQS TQELFIPNIT VNNSGSYMCQ 300 
AHNSATGLNR TTVTMITVSG SAPVLSAVAT VGITIGVLAR VALI 

45 

Seq ID NO: 626 DNA sequence 
Nucleic Acid Accession #: M18728.1 
Coding sequence: 1355.. 1657 

50 1 11 21 31 41 51 

1 I I I I 1 

GGAGCTCAAG CTCCTCTACA AAGAGGTGGA CAGAGAAGAC AGCAGAGACC ATGGGACCCC 60 

CCTCAGCCCC TCCCTGCAGA TTGCATGTCC CCTGGAAGGA GGTCCTGCTC ACAGCCTCAC 12 0 

TTCTAACCTT CTGGAACCCA CCCACCACTG CCAAGCTCAC TATTGAATCC ACGCCATTCA 180 

55 ATGTCGCAGA GGGGAAGGAG GTTCTTCTAC TCGCCCACAA CCTGCCCCAG AATCGT AT TG 240 

GTTACAGCTG GTACAAAGGC GAAAGAGTGG ATGGCAACAG TCTAATTGTA GGATATGTAA 300 

TAGGAACTCA ACAAGCTACC CCAGGGCCCG CATACAGTGG TCGAGAGACA ATATACCCCA 3 60 

ATGCATCCCT GCTGATCCAG AACGTCACCC AGAATGACAC AGGATTCTAT ACCCTACAAG 42 0 

TCATAAAGTC AGAT CTTGTG AATGAAGAAG CAACCGGACA GTTCCATGTA TACCCGGAGC 480 

60 TGCCCAAGCC CTCCATCTCC AGCAACAACT CCAACCCCGT GGAGGACAAG GATGCTGTGG 540 

CCTTCACCTG TGAACCTGAG GTTCAGAACA CAACCTACCT GTGGTGGGTA AATGGTCAGA 600 

GCCTCCCGGT CAGTCCCAGG CTGCAGCTGT CCAATGGCAA CATGACCCTC ACTCTACTCA 660 

GCGTCAAAAG GAACGATGCA GGATCCTATG AATGTGAAAT ACAGAACCCA GCGAGTGCCA 720 

ACCGCAGTGA CCCAGTCACC CTGAATGTCC TCTATGGCCC AGATGTCCCC ACCATTTCCC 780 

65 CCTCAAAGGC CAATTACCGT CCAGGGGAAA ATCTGAACCT CTCCTGCCAC GCAGCCTCTA 840 

ACCCACCTGC ACAGTACTCT TGGTTTATCA ATGGGACGTT CCAGCAATCC ACACAAGAGC 900 

TCTTTATCCC CAACATCACT GTGAATAATA GCGGATCCTA TATGTGCCAA GCCCATAACT 960 

CAGCCACTGG CCTCAATAGG ACCACAGTCA CGATGATCAC AGTCTCTGGA AGTGCTCCTG 102 0 

TCCTCTCAGC TGTGGCCACC GTCGGCATCA CGATTGGAGT GCTGGCCAGG GTGGCTCTGA 1080 

70 TATAGCAGCC CTGGTGTATT TTCGATATTT CAGGAAGACT GGCAGATTGG ACCAGACCCT 1140 

GAATTCTTCT AGCTCCTCCA ATCCCATTTT ATCCCATGGA ACCACTAAAA ACAAGGTCTG 1200 

CTCTGCTCCT GAAGCCCTAT ATGCTGGAGA TGGACAACTC AATGAAAATT TAAAGGGAAA 12 60 

ACCCTCAGGC CTGAGGTGTG TGCCACTCAG AGACTTCACC TAACTAGAGA CAGTCAAACT 1320 

GCAAACCATG GTGAGAAATT GACGACTTCA CACTATGGAC AGCTTTTCCC AAGATGTCAA 1380 

75 AACAAGACTC CTCATCATGA TAAGGCTCTT ACCCCCTTTT AATTTGTCCT TGCTTATGCC 1440 

TGCCTCTTTC GCTTGGCAGG ATGATGCTGT CATTAGTATT TCACAAGAAG TAGCTTCAGA 1500 

GGGTAACTTA ACAGAGTGTC AGAT CTATCT TGTCAATCCC AACGTTTTAC ATAAAATAAG 1560 

AGATCCTTTA GTGCACCCAG TGACTGACAT TAGCAGCATC TTTAACACAG CCGTGTGTTC 162 0 

AAATGTACAG TGGTCCTTTT CAGAGTTGGA CTTCTAGACT CACCTGTTCT CACTCCCTGT 1680 

80 TTTAATTCAA CCCAGCCATG CAATGCCAAA TAATAGAATT GCTCCCTACC AGCTGAACAG 1740 

GGAGGAGTCT GTGCAGTTTC TGACACTTGT TGTTGAACAT GGCTAAATAC AATGGGTATC 1800 

GCTGAGACTA AGTTGTAGAA ATTAACAAAT GTGCTGCTTG GTTAAAATGG CTACACTCAT 1860 

CTGACTCATT CTTTATTCTA TTTTAGTTGG TTTGTATCTT GCCTAAGGTG CGTAGTCCAA 192 0 

CTCTTGGTAT TACCCTCCTA ATAGTCATAC TAGTAGTCAT ACTCCCTGGT GTAGTGTATT 1980 

85 CTCTAAAAGC TTTAAATGTC TGCATGCAGC CAGCCATCAA ATAGTGAATG GTCTCTCTTT 204 0 

GGCTGGAATT ACAAAACTCA GAGAAATGTG TCAT CAGGAG AACAT CAT AA CCCATGAAGG 2100 

ATAAAAGCCC CAAATGGTGG TAACTGATAA TAGCACTAAT GCTTTAAGAT TTGGTCACAC 2160 



427 




428 



10 



WO 02/086443 

ATCCAGTGAC AATGTGCCCC 
TTCTAGAGCC AGTCTCTGCC 
GGGGTGGGGG GCGGTGAATC 
AGGTGTCTGG TTGCCCTGCC 
ACAAAACAGC TGACACTGAC 
CCTTCCTTAG GACCTGGGGG 
TCACTCAGAT GTCCTGAAAT 
TTAACACTAG GGGCTGGCCC 
CCCAAAGCGG GGAGGAGATA 
AATAAAAGAA TCTTTAACTT 



PCT/US02/12476 



CTGCCAGCCG 
TCCCAGACGC 
ACCTCTGAGG 
TCTGGCTCCA 
TAAGGAACTG 
CCAGGCTGAC 
TCCACCACGG 
ACTAGGAGGG 
TTTATTTTGG 
TAAAAAAAAA 



GGGCTCGCCC 
GGCGGGAGCC 
CCTGGGCCCA 
GAACAGAAAG 
CAGCATTTGC 
TTGGGGGGCA 
GGGTCACCCT 
CTGGCCCTAA 
GGAGAGTTTG 
AAAAAAAA 



ACTCATCATT 
AAGCTCCTCC 
GGGTTCAGGG 
GGAGCCTCAC 
ACAGGGGAGG 
GACTTGACAC 
GGGGGGTTAG 
GATACAGACC 
GAGGGGAGGG 



CATTCATCCA 480 

AACCACAAGG 540 

GAACCTTCCA 600 

GCTGGCTCAC 660 

GGGGTGCCCT 720 

TAGGCCCCAC 780 

GGACCTATTT 840 

CCCCCAACTC 900 

AGAATTTATT 960 



15 



Seq ID NO: 631 Protein sequence 
Protein Accession #: NP_057723.1 



11 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



21 31 41 51 

I i I I I I 

MARGSLRRLL RLLVLGLWLA LLRSVAGEQA PGTAPCSRGS SWSADLDKCM DCASCRARPH 

SDFCLGCAAA PPAPFRLLWP ILGGALSLTF VLGLLSGFLV WRRCRRREKF TTPIEETGGE 

GCPAVALIQ 

Seq ID NO: 632 DNA sequence 

Nucleic Acid Accession #: NM_003816.1 

Coding sequence: 79..2538 



85 



CGGCAGGGTT 
CCTGCGGAAT 
CGGTGGTTGC 
CAACAGACCT 
AGAAGAGAAG 
AAAG AG CAT A 
TATACTTACA 
CATTATCGGG 
GGACTCAGAG 
AGCTCTCATT 
TGTGGAGTTT 
CCCAGCATGA 
GAGCTGTTCA 
GTGAGAGAAG 
ATTCGAATTG 
GGGGGTGCTG 
CGT CGGAGAC 
ATGGCATTTG 
CAAATCACTG 
ATGAAT CACG 
GGAGCATCGG 
TTAAATAAAG 
CCCTCCTGTG 
GAATGTGAAT 
TGTGCATATG 
GGAAAAACCA 
CCAGATGTTT 
GGCATGTGCC 
GCCCCCAAAG 
TTCTCTGGCA 
TGTGAGAATG 
AGTCGAGGCA 
GGGATGGTTA 
GTAGATGCTT 
GTATGTAATA 
ACTAAAGGAT 
TTGAGGGACG 
TTTATCTTCA 
ACATATGAGT 
CGACATGTTT 
GTACCAACCT 
CCGAAAGTAT 
TATAGTTCCC 
CTAATACTTT 
GAAAACAAAA 
AGTTGTGAAA 
CATCATTGAA 
TGAACATGTT 
AGTGTTTAAG 
AACATGTGAT 
TTTTTCATCA 
CATGAATAAG 
TTATTTTGAA 
TCCATTTTTA 
GAATTTCTAT 
TAAATTATAA 
GGCTATAATA 
CTTGAGAATT 
AGAATGTTTA 
CATAGAAATT 
TTACTGTGGT 



11 

I 

GGAAAATGAT 
CGGCCGAGAT 
TGTTGCTTGG 
CACATCTTTC 
CCCCTAGGCC 
TTATTCACTT 
ACAAGGAAGG 
GCTATGTGGA 
GATTGCTGCA 
TTGAGCACAT 
CCAACAAGGA 
CTCAGCTACT 
TTGTCGTAGA 
AGATGATTCT 
TGCTAGT TGG 
GTGATGTGCT 
ATGACAGTGC 
TGGGAACAGT 
TGG AG AC AT T 
ATGATGGGAG 
GTTCCAGAAA 
GAGGAAA CTG 
GTAATAAGTT 
TGGACCCTTG 
GTGACTGTTG 
GTGAGTGTGA 
TTATTCAGAA 
AGTATTATGA 
ATTGTTTCAT 
ATGAATACAA 
TACAAGAGAT 
CCAAATGTTG 
ACGAAGGCAC 
CTGTTCTGAA 
GCAATAAGAA 
ACGGAGGAAG 
GACTTCTGGT 
TCAAGAGGGA 
CAGATGGCAA 
CTCCAGTGAC 
ATGCAGCCAA 
CATCT CAGGG 
T CACT TG ATT 
TTTTTTTTCT 
CACCACAAAA 
TACAAGGAAA 
TAAGTCTTAT 
ATTGCAGTGA 
TGTTATTCTG 
AATCTAATAC 
TGCACGAATT 
CAAATATTGT 
AGTACAAAAT 
TGACCTTTCA 
TATGAATCAT 
GCTTTAAGGT 
AAGCAGGAGC 
TCATGAGCAC 
CATTTACTAA 
AGGCTGGAGA 
ATCTATGAGT 



21 



GGAAGAGGCG 
GGGGTCTGGC 
CCTGGTGGGC 
TTCTTATGAA 
CTATTCAAAA 
GGAAAGGAAC 
GACTTTAATC 
GGGAGTTCAT 
TTTAGAGAAT 
CATTTATCGA 
TATAGAGAAA 
TCGAAGAAGA 
CAAGGAAAGG 
CCTGGCAAAC 
ACTGGAGATT 
GGGGAACTTC 
ACAGCTAGTT 
GTGTTCAAGG 
TGCTTCCATT 
AGATTGTTCC 
CTTTAGCAGT 
CCTTCTTAAT 
GGTGGACGCT 
CTGCGAAGGA 
TAAAGACTGT 
TGTTCCAGAG 
TGGATATCCT 
TGCTCAATGT 
TGAAGTGAAT 
GAAGTGTGCC 
ACCTGTATTT 
GGGTGTGGAT 
AAAATGTGGT 
TTATGACTGT 
TTGTCACTGT 
TGTGGACAGT 
CTTCTTCTTC 
TCAACTGTGG 
AAATCAAGCA 
ACCTCCCAGA 
GCAACCTCAG 
AAACTTAATT 
TTTTTAACCT 
TGATGTTTTC 
CAGACTTCAC 
TG CAGTAAAG 
TCAGTCATCG 
TTCTCAAATT 
AATTTTCTAC 
CTGTGAAAAC 
AATAATCATC 
CTTCAAAAGA 
ATACTAAAAG 
ACTATAGGTA 
GTGAAAGCAT 
ACGAAGTATT 
AATTATAAAA 
TTTAAAATCT 
GGTGTGCTGG 
AAGAAGGAAG 
TATCATCTTA 



31 
I 

GAGGTGGAGG 
GCGCGCTTTC 
CCAGTCCTCG 
ATTATAACTC 
CAAGTATCTT 
AAAGACCTTT 
ACTGACCATC 
AATTCATCCA 
GCGAGTTATG 
ATGGATGATG 
GAAACTGCAA 
AGAGCTGTCT 
TATGACATGA 
TACTTGGATA 
TGGACCAATG 
GTGCAGTGGC 
CTAAAGAAAG 
AGCCACGCAG 
GTTGCTCATG 
TGTGGAGCAA 
TGCAGTGCAG 
ATTCCAAAGC 
GGGGAAGAGT 
AGTACCTGTA 
CGGTTCCTTC 
TACTGCAATG 
TGCCAGAATA 
CAAGT CATCT 
TCTAAAGGTG 
ACTGGGAATG 
GGAATTGTGC 
TTCCAGCTAG 
GCTGGAAAGA 
GATGTTCAGA 
•GAAAATGGCT 
GGACCTACAT 
CTAATTGTTC 
AGAAGCTACT 
AACCCTTCTA 
GAAGTTCCTA 
CAGTTCCCAT 
CCTGCCCGTC 
TCTTTTTGCA 
TTGAAAAGCC 
TAACACAGAA 
CCAGGGAATT 
GTGAGGTTAA 
AACTGTATTG 
CTTAGTTATC 
TGACTAATCA 
ATACTCTAGA 
ATGCACAAGA 
AGTGTGTGTG 
ATAACTCTTA 
GACATTCGTT 
TAATAGATCT 
TCTTCAATCA 
GAACTTTCAA 
GTCATGTAAA 
AAATGGTTTT 
GCTGTGTTAA 



41 

I 

CGACCGAGTG 
CCTCGGGGAC 
GTGCGGCGCG 
CTTGGAGATT 
ATGTTATTCA 
TGCCTGAAGA 
CCAATATACA 
TTGCTCTTAG 
GGATTGAACC 
TCTACAAAGA 
AGGATGAAGA 
TGCCACAGAC 
TGGGAAGAAA 
GTATGTATAT 
GAAACCTGAT 
GGGAAAAGTT 
GTTTTGGTGG 
GCGGGATTAA 
AATTGGGTCA 
AGAGCTGCAT 
AGGACTTTGA 
CTGATGAAGC 
GTGACTGTGG 
AGCTTAAATC 
CAGGAGGTAC 
GTTCTTCTCA 
ACAAAGCCTA 
TTGGCTCAAA 
ACAGAT TTGG 
CTTTGTGTGG 
CTGCTATTAT 
GATCAGATGT 
TCTGTAGAAA 
AAAAGTGTCA 
GGGCTCCCCC 
ACAATGAAAT 
CCCTTATTGT 
TCAGAAAGAA 
GACAGCCGGG 
TATATGCAAA 
CAAGGCCACC 
CTGCTCCTGC 
AATGTCTTCA 
TTTCTGTTGC 
AAACAGAAAC 
TACAATAACA 
TGC ACT AAT C 
GTGTAAGATT 
ATTAATGTAG 
GCTGCCAATA 
ATCTTGTCTG 
ACCACAATTA 
TATTCACGCA 
GAGAAATTAA 
CACAATAGCA 
AATCAAATAT 
ATTGAACTTT 
AGCTTGCTAT 
ATATTAGACA 
CTTAAATACC 
AAATGAATTT 



51 
I 

CTGAGAGGAA 
CCTTCGTGTC 
GCCAGGCTTT 
AACTAGAGAA 
GGCTGAAGGA 
TTTTGTGGTT 
GAATCATTGT 
CGACTGTTTT 
CCTGCAGAAC 
GCCTCTGAAA 
GGAAGAGCCT 
CCGGTATGTG 
TCAGACTGCT 
TATGTTAAAT 
CAACATAGTT 
TCTTATCACA 
AACTGCAGGA 
TGTGTTTGGA 
TAATCTTGGA 
CATGAATTCA 
GAAGTTAACT 
CTATAGTGCT 
TACTCCAAAG 
ATTTGCTGAG 
TTTATGCCGA 
GTTCTGTCAG 
TTGCTACAAC 
AGCCAAGGCT 
CAATTGTGGT 
AAAGCTTCAG 
TCAAACGCCT 
TCCAGATCCT 
CTTCCAGTGT 
TGGACATGGG 
AAATTGTGAG 
GAATACTGCA 
CTGTGCTATT 
GAG AT CACAA 
GAGTGTTCCT 
CAGATTTGCA 
TCCACCACAA 
ACCTCCTTTA 
GGGAACTGAG 
AACTATGAAT 
TGAGTGTGAG 
TTTCCGTTTC 
ATGGATTTTT 
TTTGTCATTA 
TTCCTCATTG 
ATATCTAATA 
TCACTCACTA 
AGATGTCATA 
GTTACTCGCT 
TTTAATATTA 
CTATTTTAAA 
GTTGATTCAT 
TACAAAACCA 
TAAATCATTT 
CTAATATTTT 
TACAAAAAAG 
TTACTATGGC 



60 
120 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 



429 



WO 02/086443 

AGATATGGTA TGGATCGTAA AATTTTAAGC ACTAAAAATT TTTTCATAAC CTTTCATAAT 3720 
AAAGTTTAAT AATAGGTTTA TTAACTGAAT TTCATTAGTT TTTTAAAAGT GTTTTTGGTT 3780 
TGTGTATATA TACATATACA AATACAACAT T T ACAAT AAA TAAAATACTT GAAATTCTCA 3840 
AAAAAAAAAA AAAAAAAAAA AAAAA 



PCT/US02/12476 



Seg ID NO*. 633 Protein sequence 
Protein Accession #: NP 003 807.1 



10 



15 



20 



25 



30 



35 



40 



MGSGARFPSG 
PYSKQVSYVI 
EGVHNSSIAL 
D I EKETAKDE 
LLANYLDSMY 
AQLVLKKGFG 
RDCSCGAKSC 
LVD AGEECD C 
DVPEYCNGSS 
IEVNSKGDRF 
WGVDFQLGSD 
NCHCENGWAP 
DQLWRSYFRK 
KQPQQFPSRP 



11 
I 

TLRVRWLLLL 
QAEGKEHI IH 
SDCFGLRGLL 
EEEPPSMTQL 
IMLNIRIVLV 
GTAGMAFVGT 
IMNSGASGSR 
GTPKECELDP 
QFCQPDVFIQ 
GNCGFSGNEY 
VPDPGMVNEG 
PNCETKGYGG 
KRSQTYESDG 
PPPQPKVSSQ 



21 
I 

GLVGPVLGAA 
LERNKDLLPE 
HLENASYGIE 
LRRRRAVLPQ 
GLiEIWTNGNL 
VCSRSHAGGI 
NFSSCSAEDF 
CCEGSTCKLK 
NGYPCQNNKA 
KKCATGNALC 
TKCGAGKICR 
SVDSGPTYNE 
KNQANPSRQP 
GNLIPARPAP 



31 
I 

RPGFQQTSHL 
DFWYTYNKE 
PLQNSSHFEH 
TRYVELFIW 
INIVGGAGDV 
NVFGQITVET 
EKLTLNKGGN 
SFAECAYGDC 
YCYNGMCQYY 
GKLQCENVQE 
NFQCVDASVL 
MNTALRDGtiL 
GSVPRHVSPV 
APPLYSSLT 



Seq ID NO: 634 DNA sequence 

Nucleic Acid Accession #: NM_0 02 091.1 

Coding sequence: 56.. 503 



45 



AGTCTCTGCT 
CGGCAGTGAG 
AGCGGTCCCG 
CCACTGGGCG 
TGAGAGAGGG 
GAATTTGCTG 
GGCCTTGGGC 
AGGTTCAAAA 
CCCCCAGCTG 
TAAGAGACTG 
AAATATTTGA 
CTTCTGGTTT 
TTTTTATATC 
TAAAAGCTTA 



CTTCCCAGCC 
CTCCCGCTGG 
CTGCCTGCGG 
GTGGGGCACT 
AGCCTGAAGC 
GGTCTCATAG 
AATCAGCAGC 
GGCAAAGTTG 
AACCAGCAAT 
AGTTCTGCAA 
CTATTCTGTA 
AAACTTGTTT 
TAGGCTACCT 
AACACAT 



21 

1 

TCTCCGGCGC 
TCCTGCTGGC 
GCGGAGGGAC 
TAATGGGGAA 
AGCAGCTGAG 
AAGCAAAGGA 
CTTCGTGGGA 
GTAGACTCTC 
GATAATGATG 
GCATCAGTTC 
TCTTTCATCC 
GCTGTGAACA 
GTTGGTTAGA 



31 



GCTCCAAGGG 
GCTGGTCCTC 
CGTGCTGACC 
AAAGAGCACA 
AGAGTACATC 
GAACAGAAAC 
TTCAGAGGAT 
TGCTCCAGGT 
GCCTCTCTCA 
TACGGATCAT 
TTGACTAAAT 
ATTGTCGAAA 
TTCAAGGCCC 



41 

I 

SSYEIITPWR 
GTLITDHPNI 
I I YRMDDVYK 
DKERYDMMGR 
LGNFVQWREK 
FAS I VAHELG 
CLLNIPKPDE 
CKDCRFLPGG 
DAQCQVIFGS 
IPVFGIVPAI 
NYDCDVQKKC 
VFFFLIVPLI 
TPPREVPIYA 



51 
I 

LTRERREAPR 
QNHCHYRGYV 
EPLKCGVSNK 
NQT AVREEM I 
FLITRRRHDS 
HNLGMNHDDG 
AYSAPSCGNK 
TLCRGKTSEC 
KAKAAPKDCF 
IQTPSRGTKC 
HGHGVCNSNK 
VCAIFIFIKR 
NRFAVPTYAA 



41 

I 

CTTCCCGTCG 
TGCCTAGCGC 
AAGATGTACC 
GGGGAGTCTT 
AGGTGGGAAG 
CACCAGCCAC 
AGCAGCAACT 
TCTCAACGTG 
AAAGAGAAAA 
CAACAAGATT 
TCGTGATTTT 
AGAGTCTTCC 
CGAGCTGTTA 



51 



GGACCATGCG 
CCCGGGGGCG 
CGCGCGGCAA 
CTTCTGTTTC 
AAGCTGCAAG 
CTCAACCCAA 
TCAAAGATGT 
AAGGAAGGAA 
ACAAAACCCC 
TCCTTGTGCA 
CAAGCAGCAT 
AATTAATGCT 
CCATTCACAA 



60 
12 0 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 



50 



55 



60 



65 



70 



75 



80 



Seq ID NO: 635 Protein sequence 
Protein Accession #: NP_002082.1 

1 11 21 31 41 51 

I I I I I I 

MRGSELPLVL LALVLCLAPR GRAVPLPAGG GTVLTKMYPR GNHWAVGHLM GKKSTGESSS 

VSERGSLKQQ LREYIRWEEA ARNLLGL I EA KENRNHQPPQ PKALGNQQPS WDSEDSSNFK 

DVGSKGKVGR LSAPGSQREG RNPQLNQQ 

Seq ID NO: 63 6 DNA sequence 

Nucleic Acid Accession #: NM_016522.1 

Coding sequence: 2 65.. 12 99 



85 



GCGGAAGCAG 
CTGGCAAAAG 
TTTTCTCCTC 
CCGCACCCCA 
TCGGGGAAGT 
TGCCTCGTGG 
AGCGGAGATG 
GCCACCCTCA 
ACCATCCTCT 
AACACCCAAA 
TACACCTGCT 
CAAGTATCTC 
ATTAGCCTCA 
TCTCCCAAAG 
CGGGAACAGT 
CGGAGAGTAA 
GTCCCCGTGG 
TTCCAGTGGT 
AACAGACCTT 
TACACTTGCG 
CCAGGCGCCG 
CTGCCTCTTC 
CGGGAAAGGC 
CCAAT CAGAT 
GGGAGGGGAA 
CCTTGCAGAT 



11 
I 

CGAGGAGGGA 
CCGAGGCTGG 
CCCGCGCCTC 
CCCACTTCCT 
TGTGGCTGTC 
TCGTGTCTCT 
CCACCTTCCC 
GGTGCACTAT 
ATGCTGGGAA 
CGCAGTACAG 
CGGTGCAGAC 
CCAAAATTGT 
CCTGCATAGC 
CGGTTGGCTT 
CAGGGGACTA 
AGGTCACCGT 
GACAAAAGGG 
ACAAGGATGA 
TCCTCTCAAA 
TGGCCTCCAA 
TCAGCGAGGT 
TGGTCTTGCA 
TGCCGCCACC 
ATATACAAAT 
CAAAGAATAC 
ATTTAGGTAC 



21 
I 

GCCCCCTTTG 
ATTTGGGGGA 
CCGGTCGCCG 
GTGCTCGCCC 
GAGAATGGGG 
CAGGCTGCTG 
CAAAGCTATG 
TGACAACCGG 
TGACAAGTGG 
CATCGAGATC 
AGACAACCAC 
AGAGATTTCT 
AACTGGTAGA 
TGTGAGTGAA 
CGAGTGCAGT 
GAACTATCCA 
GACACTGCAG 
CAAAAGACTG 
ACTCATCTTC 
CAAGCTGGGC 
GAGCAACGGC 
CCTGCTTCTC 
ACCACCACCA 
GAAATTAGAA 
TTTGGGGGGA 
AATGGAGTTT 



31 

1 

GCCGTCCTCC 
GGAATATTAG 
CGGGTTCACC 
GGGGGGCGTG 
GTCTGTGGGT 
TTCCTTGTAC 
GACAACGTGA 
GTCACCCGGG 
TGCCTGGATC 
CAGAACGTGG 
CCAAAGACCT 
TCAGATATCT 
CCAGAGCCTA 
GACGAATACT 
GCCTCCAATG 
CCATACATTT 
TGTGAAGCCT 
ATTGAAGGAA 
TTCAATGTCT 
CACACCAATG 
ACGTCGAGGA 
AAATTTTGAT 
ACACAACAGC 
GAAACACAGC 
AAAGAGTTTT 
TCTTTTCCCA 



41 
I 

GTGGAACCGG 
ACTCGGAGGA 
GCTCAGTCCC 
TGCCGTGCGG 
ACCTGTTCCT 
CCACAGGAGT 
CGGTCCGGCA 
TGGCCTGGCT 
CTCGCGTGGT 
ATGTGTATGA 
CTAGGGTCCA 
CCATTAATGA 
CGGTTACTTG 
TGGAAATT CA 
ACGTGGCCGC 
CAGAAGCCAA 
CAGCAGTCCC 
AGAAAGGGGT 
CTGAACATGA 
CCAGCATCAT 
GGGCAGGCTG 
GTGAGTGCCA 
AATGGCAACA 
CTCATGGGAC 
AAAAAAGAAA 
AACGGGAAGA 



51 
I 

TTTTCCGAGG 
GTCTGCGCGC 
CGCGCTCGCT 
CTGCCGGAGT 
GCCCTGGAAG 
GCCCGTGCGC 
GGGGGAGAGC 
AAACCGCAGC 
CCTTCTGAGC 
CGAGGGCCCT 
CCTCATTGTG 
AGGGAACAAT 
GAGACACATC 
GGGCATCACC 
GCCCGTGGTA 
GGGTACAGGT 
CTCAGCAGAA 
GAAAGTGGAA 
CTATGGGAAC 
GCTATTTGGT 
CGTCTGGCTG 
CTTCCCCACC 
CCGACAGCAA 
AGAAATTTGA 
TTGAAAATTG 
AC AC AG C AC A 



60 
120 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 



430 



WO 02/086443 

CCCGGCTTGG ACCCACTGCA AG CTG CAT CG TGCAACCTCT TTGGTGCCAG TGTGGGCAAG 1620 

GGCTCAGCCT CTCTGCCCAC AGACTGCCCC CACGTGGAAC ATT CTGGAGC TGGCCATCCC 1680 

AAATTCAATC AGTCCATAGA GACGAACAGA ATGAGACCTT CCGGCCCAAG CGTGGCGCTT 1740 

CCGGCCCAAG CGTGGCGCTG CGGGCACTTT GGTAGACTGT GCCACCACGG CGTGTGTTGT 1800 
GAAACGTGAA ATAAAAAGAG CAAAAAAAAA AAAAAAAAA 



PCT/US02/12476 



10 



15 



Seq ID NO: 637 Protein sequence 
Protein Accession #: NP 057606.1 



MGVCGYLFLP 
NRVTRVAWLN 
NHPKTSRVHL 
SEDEYLEIQG 
LQCEASAVPS 
LGHTNASIML 



11 
I 

WKCLWVSLR 
RSTILYAGND 
IVQVSPKIVE 
ITREQSGDYE 
AEFQWYKDDK 
FGPGAVSEVS 



21 



LLFLVPTGVP 
KWCLDPRWL 
ISSDISINEG 
CSASNDVAAP 
RLIEGKKGVK 
NGTSRRAGCV 



31 

I 

VRSGDATFPK 
LSNTQTQYSI 
NNISLTCIAT 
WRRVKVTVN 
VENRPFLSKL 
WLLPLLVLHL 



41 

I 

AMDNVTVRQG 
EIQNVDVYDE 
GRPEPTVTWR 
YPPYISEAKG 
IFFNVSEHDY 
LLKF 



51 



ESATLRCTID 60 

GPYTCSVQTD 120 

HISPKAVGFV 180 

TGVPVGQKGT 240 

GNYTCVASNK 300 



20 



Seq ID NO: 638 DNA sequence 

Nucleic Acid Accession #: NM_012261.1 

Coding sequence: 203.. 1045 



25 



30 



35 



40 



45 



50 



55 



GATTTGCTCT 
ACAGAATACG 
CACTCCAGCG 
CCTCATTCGG 
ACTTCGAGTT 
GGAAAATCTC 
TGGGACGACG 
GGCCAGCAAC 
TGAGGTGAAG 
CGCATATGCA 
GGCGACTTGG 
CAAAGACGCA 
CACCCCCGCT 
TGATCCGCAG 
TATCTCAGAT 
GGAAGAAACC 
CGCGATTTAC 
ATCCCAGTAT 
CCAACTGGAT 
CATAGCTACA 
AACCCACGGA 
ATGCTGGGGA 
TGACTCTCCA 
TTGAAAACAT 
TGCTCCCTTG 
TCATGCTCCC 
GTTTAGTGAT 
AAAACGACTA 
GGGGGACCTG 
TTCTCTGGC 



11 

I 

GCCAGCAGCT 
CGCTCCCTCC 
GCGACTTTGA 
GGCACTGCGA 
CTCCTGATGT 
TCAGGCCTTT 
TGTCTCATGG 
TACGTAGATC 
GGCCGCTGTG 
CTCAAAATGC 
AGGCTGAGCA 
GTCAGTGCTG 
GGGAAGTCCT 
AAGACGGTCA 
TTTGTCTTCA 
TTGCCCCTGA 
CACGTCCACC 
AAG CACATGG 
CAGGTAGAAC 
AT CAAACAGG 
AGGGGGAGAC 
GGAGGGGAGG 
AAGAGCAATA 
GCTTCTTTGA 
GACACAGCTG 
TGCAGCAAGA 
TGTCTTGGGA 
ATGTAACTAT 
AAGAATCAAT 



21 



GTCGGTGCCG 
CTCCCCCTTC 
GGGATTCCCT 
GTATGGATCT 
TGTTCCATAC 
CCACTAACCC 
CAGAGTTTGC 
TGATCACAGA 
GCCACAGCCA 
T CTTTGT AAA 
AAGTGCAGTT 
GGAAGCACAC 
ATGAGTGTCA 
CCATGATCCT 
GTGAAGAGCA 
TTTTGGGGCT 
AC AAAAT G AC 
GCTAGAGGCC 
AACAAAAGCA 
CCTGGGTATC 
TCTTTCGGAT 
AGGGTCTCAG 
AATGCCACTT 
GGAGGAAACC 
GCTTATCCTA 
CCCCTGAAAG 
ATGTTTCACT 
GCAGAGTTGT 
CTGTGTGAGT 



31 

1 

CGCTCGACAC 
TCTGTCCCCC 
CTCTGGCGGC 
CCAAGGAAGA 
AATGGCTCAA 
TGAAAAAGAT 
AGCCAAATTT 
ACAGGCCGAT 
GTCGGAGCTG 
GGAAAGCCAC 
TGTCTACGAC 
AGCCAACTCG 
AGCTCAACAA 
GTCTGCGGTC 
TAAATGCCCA 
CATCTTGGGC 
TGCCAACCAG 
GTTAGGCAGG 
CTTTTCCATC 
TGAGGCTTGC 
TTGTAGGGTG 
ACAGCTTTCG 
GGAGCTGTAT 
CCTTTAGGTT 
TACAGTTGTC 
TGATTCATGC 
GCTACCCGCA 
TTGGACTTCT 
CTGTTTTTCA 



41 

1 

CGAGTCCTAG 
GCCTCTCGCT 
CTCTGCAGCA 
GGGGTCCCCA 
AT CATGGCAG 
ATATTTGTGG 
ATTGTACCTT 
ATCGCATTGA 
CAAGTGTTCT 
AACATGTCCA 
TCCTCGGAGA 
CACCACCTCT 
ACCATTTCAC 
CACATCCAAC 
GTGGATGAGC 
CTCGTCATCA 
GTGCAGATCC 
CACCCCCTAT 
TTGTACACGA 
TTGGCTTGTG 
AAATGGCAAT 
TGCTCATGGT 
CTGGCCCCAA 
CAGAAGAATA 
AATGCACACA 
TTCTGGCTGG 
TCCAGCGACT 
TCCTGTGCCA 
AAATGAAATA 



51 



CTAGGCGCTC 60 

CACCCCGGCC 120 

GCACAGCCGG 180 

GCATCGACAG 2 4 0 

AACAAGAAGT 300 

TGCGGGAAAA 3 60 

ATGATGTGTG 420 

CCCGGGGAGC 480 

GGGTGGATCG 540 

AGGGACCTGA 600 

AAACCCACTT 6 60 

CTGCCTTGGT 72 0 

TGGCCTCTAG 780 

CTTTTGACAT 840 

GGGAGCAACT 900 

TGGTAACACT 960 

CTCGGGACAG 1020 

TCCTGCTCCC 1080 

GATACACCAA 1140 

TCCATGCTTA 1200 

TATTCTCTCC 1260 

GGCTTGGCTT 132 0 

AGTTTAGGGA 1380 

TGGGGTGCTT 1440 

GAATACAACC 1500 

CATTCTGCAT 1560 

GCAGCACCAG 1620 

GGTCCAAGTC 1680 

AAACACACTA 1740 



Seq ID NO: 639 Protein sequence 
Protein Accession #: NP 036393.1 



60 



65 



I 

MDLQGRGVPS 
EFAAKFIVPY 
FVKESHNMSK 
ECQAQQTISL 
LGLILGLVIM 



11 
I 

IDRIiRVLlrMIj 
DVWASNYVDL 
GPEATWRLSK 
ASSDPQKTVT 
VTLAI YHVHH 



21 
I 

FHTMAQIMAE 
ITEQADIALT 
VQFVYDSSEK 
MILSAVHIQP 
KMTANQVQIP 



31 41 51 

I I I 

QEVENLSGLS TNPEKDIFW RENGTTCLMA 60 

RGAEVKGRCG HSQSELQVFW VDRAYALKML 12 0 

THFKDAVSAG KHTANSHHLS ALVT PAGKS Y 180 

FDIISDFVFS EEHKCPVDER EQLEETLPLI 240 
RDRSQYKHMG 



70 



Seq ID NO: 640 DNA sequence 

Nucleic Acid Accession #: NM_002 993.1 

Coding sequence: 64.. 40 8 



75 



80 



85 



GGCACGAGCC 
ACTATGAGCC 
GCGCTGCTCG 
GTCTCTGCTG 
CCCAAAACGA 
GTGGTAGCCT 
AAGAAAGTCA 
ACCATGCATC 
CAGTAAGAAT 
GAAGAGTGTG 
CTAATATAGT 
CAATTGACCA 
TGAAGATAAC 
ATTTCGTATG 
ACTCACTCTT 



11 

I 

AGTCTCCGCG 
TCCCGTCCAG 
CGCTGCTGCT 
TGCTGACAGA 
TTGGTAAACT 
CCCTGAAGAA 
TCCAGAAAAT 
ATAAAATTGC 
AAGAAGGAAG 
GGGGAAAGCC 
ATTTCCACTA 
TATTGTGAGC 
TATTGTATTT 
GAAATAATGT 
CT CAT AAAAT 



21 
i 

CCTCCACCCA 
CCGCGCGGCC 
CCTGCTGACG 
GCTGCGTTGC 
GCAGGTGTTC 
CGGGAAGCAA 
TTTGGACAGT 
CCAGTCTTCA 
GGTTGGTTTT 
TACGCTTCTC 
TTTACTGTTA 
AAAGAATCAC 
CTAT CATACA 
TTTATTAGTG 
AGGAAATATT 



31 
I 

GCTCAGGAAC 
CGTGTCCCGG 
CCGCCGGGGC 
ACTTGTTTAC 
CCCGCAGGCC 
GTTTGTCTGG 
GGAAACAAGA 
GCGGAGCAGT 
TTTCCATTTT 
CCTGAAGTTT 
TTTTACCTGA 
TGGTTATTAG 
TTCCTTAAAG 
TGCTGTTGAG 
TTAGTTCTGT 



41 
I 

CCGCGAACCC 
GTCCTTCGGG 
CCCTCGCCAG 
GCGTTACGCT 
CGCAGTGCTC 
ACCCGGAAGC 
AAAACTGAGT 
TTTCTGGAGA 
CTACATGGAT 
ACAGCTCAGC 
TAAGTTATTG 
TCTTTCAATG 
TCTTACCGAA 
GGAGGTATCC 
TTTCTTGGGG 



51 
I 

TCTCTTGACC 60 

CTCCTTGTGC 12 0 

CGCTGGT CCT 180 

GAGAGTAAAC 240 

CAAGGTGGAA 300 

CCCTTTTCTA 360 

AACAAAAAAG 420 

TCCCTGGACC 480 

TCCCTACTTT 540 

TAATGAAGTA 600 

AACCCTTTGG 660 

AATATTGAAT 720 

AAGGCTGTGG 780 

TGTTGTTCTT 840 

AATATGTTAC 900 



431 



10 



WO 02/086443 

TCTTTACCCT AGGATGCTAT 
TTATCTGTGC AGAATATATT 
CTAATATATT CTCTTCCTAT 
CATGATTTAC TCATTAAACT 
ATTCTGGTCA CTAAATATAC 
TGATTGCTAA TTTACATAGA 
AATGAT CTGT GCTCTGCAAA 
CATTTAGTCC TCAAAATATA 
TTTAAAGGTT TTGACCATTT 
AAATTGCACT TTTATTTTTT 
TGGAGAAACA ATAAAAGATT 



PCT/US02/12476 



TTAAGTTGTA 
TCCTTATTCA 
GGTTTTAGAT 
TTGATTTTGT 
ACTTTAGATA 
AATGTATTCT 
GTTTTGAAAA 
TACAGCATTG 
TGTTATGAGG 
CCTGTGTGTC 
TCTAAACCAA 



CTGTATTAGA 
GAATTTCTAA 
GTTTGATGTC 
ATGCTATTTT 
GATGAAGAAG 
CTTGGTTTTT 
TATATTTGAA 
CTAAGATTTT 
AATTATACAT 
ATGTTGGTTT 
AAAAAAAAAA 



ACACTGGGTG 
AAATTTAAGT 
TTCTTAGTAT 
TTCACTATAG 
CCCAAAAACA 
TAAATAAAAG 
CAATTTGAAT 
CAGATATCTA 
GTATCACATT 
TTGGTACTTG 
AAAAAAA 



TGTCATACCG 960 

TCTGTAAGGG 1020 

GGCATAATGT 1080 

GATGACTATA 1140 

GATAAATTCC 1200 

CAAAATTAAC 1260 

ATAAATTCAT 1320 

TTGTGGATCT 13 80 

CACTATATTA 1440 

TATTGTCATT 1500 



15 



20 



25 



30 



35 



40 



Seq ID NO: 641 Protein sequence 
Protein Accession #: NP__002984.1 

1 11 21 31 41 51 

l I I l I l 

MSLPSSRAAR VPGPSGSLCA LLALLLLLTP PGPLASAGPV SAVLTELRCT CLRVTLRVNP 
KTIGKLQVFP AGPQCSKVEV VASLKNGKQV CLDPEAPFLK KVIQKILDSG NKKN 

Seq ID NO: 642 DNA sequence 

Nucleic Acid Accession #: NM_013271.1 

Coding sequence: 27.. 80 9 ' 



TCCGGAGCCA 
CCGGGGGCGT 
TCTGCGCGCG 
AGACTGGCGC 
TGCAGGAGCT 
GGGCCGAGGC 
TCTGGGGCGC 
CTGCAGCGCA 
CCCAGCTTGT 
ACGACGGCCC 
CCGAGCTGTT 
TGGCAGCCCC 
CTGAGGGCGT 
TGCCTGCACG 
CAGAAGTGCC 
TTACCCCGGC 
GATCTGAGC 



11 
1 

GGCTCGCTGG 
CGGCCTTTTG 
GCCGGTAAAG 
TCCTCGCCGC 
GGCGCGGGCG 
GCAGGAGGCT 
CCCCCGCAAC 
GCTCGCTCGC 
CCCCGCGCCC 
CGCGGGCCCG 
GAGGTACTTG 
GCGCCGCCTC 
GCTGGGGGCG 
CCGCCTCTTG 
CCCGCCATCC 
CAGCCAGCCC 



21 

1 

GGCAGCATGG 
GTGCTGCTGC 
GAACCCCGCG 
TTCCGGCGGT 
CTGGCGCATC 
GAGGATCAGC 
TCTGATCCGG 
GCTCTGCTCC 
GTCCCCGCCG 
GATGCTGAGG 
CTGGGACGGA 
CGCCGTGCCG 
CTGCTGCGTG 
CCACCCTGAG 
CGCCACCAGG 
TCTCACCCGA 



31 
I 

CGGGGTCGCC 
TGCTCGGCCT 
GCCTAAGCGC 
CAGTGCCCCG 
TGCTGGAGGC 
AGGCGCGCGT 
CTCTGGGCCT 
GCGCCCGCCT 
CGGCGCTCCG 
AGGCAGGCGA 
TTCTTGCGGG 
CCGACCACGA 
TGAAACGCCT 
CACTGCCCGG 
ACTTCTCCCC 
GGATCCCTAC 



41 
I 

GCTGCTCTGG 
GTTTCGGCCG 
AGCGTCTCCG 
AGGTGAGGCG 
CGAACGTCAG 
CCTGGCGCAG 
GGACGACGAC 
TGACCCTGCC 
ACCCCGGCCC 
CGAGACACCC 
AAGCGCGGAC 
TGTGGGCTCT 
AGAGACCCCG 
ATCCCGTGCA 
GCCAGCACGT 
CCCCTGGCCC 



51 
I 

GGGCCGCGGG 
CCCCCCGCGC 
CCCTTGGCTG 
GCGGGGGCGG 
GAGCGGGCGC 
CTGCTGCGCG 
CCCGACGCGC 
GCCCTAGCAG 
CCGGTCTACG 
GACGTGGACC 
TCCGAGGGGG 
GAGCTGCCCG 
GCGCCCCAGG 
CGCTGGGACC 
CCAGAGCAAC 
ACAATAACAT 



60 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 



45 



Seq ID NO: 643 Protein sequence 
Protein Accession #: NP 037403.1 



50 



55 



60 



65 



70 



75 



80 



1 11 21 31 41 51 

I I I I I I 

MAGSPLLWGP RAGGVGLLVL LLLGLFRPPP ALCARPVKEP RGLSAASPPL AETGAPRRFR 

RSVPRGEAAG AVQELARALA HLLEAERQER ARAEAQEAED QQARVLAQLL RVWGAPRNSD 

PALGLDDDPD APAAQLARAL LRARLDPAAL AAQLVPAPVP AAALRPRPPV YDDGPAGPDA 

EEAGDETPDV DPELLRYLLG RILAGSADSE GVAAPRRLRR AADHDVGSEL PPEGVLGALL 

RVKRLETPAP QVPARRLLPP 

Seq ID NO: 644 DNA sequence 
Nucleic Acid Accession #: NM_002214 
Coding sequence: 681.. 2990 



85 



i 
I 

CCCAGAGCCG 
CTGCCGACTT 
GTTGGCCTCC 
TCCCCTCGAC 
TAGGGTGGTT 
CTAAGCTGAT 
TGTCCCGGAG 
TGGCCGTCGA 
GGCCGTAGGG 
CCGAGCCGCG 
GGCCCCGAGG 
GGGGCGGGCT 
TCTGCCTGCA 
CACTTGTTCT 
CCTGTGCCAG 
TTTCAGGTGG 
GCTCAGTTGA 
TTAATACCCA 
ATTTTATGCT 
ATGTCTCAGC 
CTAGAAAAAT 
AAACAGTTTC 
ACAATTTAGA 
TCACTGAGTT 
AAGGAGGTTT 
AAGAGGCTAA 



11 

I 

CCTCCCCCTG 
GTCTTTGCCC 
CTGCCCACCT 
CTCGCCGGCG 
TCCCCCCCAG 
TTATGCAGCA 
CAGGCTGCGG 
AGGAGGTGCT 
GCCCTGAGAT 
GGGTCCGCCT 
TCGCCCGGGA 
GTTTTGCATT 
AAACGACCGG 
TGGACTGGGC 
GTGCCTTGCG 
ATCAAGAAGT 
TTCAATAGAA 
GGTGACACCA 
GAAAGTTCAT 
ATCAATGCAC 
GGCATTTTTC 
ACCATACATT 
CTGCATGCCT 
TGAGAAAGCA 
TGACGCCATG 
AAGATTGCTG 



21 
I 

TTGCTGGCAT 
GCTGCTCCGC 
GTGGAAGCAA 
TACCCTCCCA 
CTTCGGGCTT 
GAAGCCCCAC 
AGCCCTTGCA 
TCTCGCGGAG 
GCCGAGCGGT 
GCTAGGCCTG 
GGCCGAGCCC 
ATGTGCGGCT 
CGAGGTCCCG 
CAAGGTGAAG 
CTGGGTCCAG 
GAACGTTGTG 
TACCCATCTG 
GGAGAAGTGT 
CCTCTGAAGA 
AATAATATAG 
TCCCGTGACT 
AGCATCCACC 
CCCCATGGAT 
GTTCATAGAC 
CTTCAGGCAG 
CTGGTGATGA 



31 
I 

CCCGAGCTTC 
AGACGGGGCT 
CTGCGCTGAT 
CAGATCCAGC 
TGTTTGGGTT 
CGGCTGGAGA 
GAGCCCTCTC 
ACCGCGGGAC 
GCCCGGGCCC 
CGGAAAACGT 
GCGTCCGGAA 
CGGCCCTGGC 
CCTCGTTCCT 
ACAATAGATG 
AATGTGGATG 
ATATTGTTTC 
TGCATGTTAT 
CTATCCAGCT 
AATATCCTGT 
AAAAATTAAA 
TTCGTCTTGG 
CCGAAAGGAT 
ACATCCATGT 
AGAAGAT CTC 
CTGTCTGTGA 
C AG AT CAG AC 



41 



CTCCCTTGCC 
GCAAAGCTGC 
TGATGCGCCA 
ATCACCCAGT 
TGATTGTGTT 
GAAACAAAAG 
TCCAGTCGCC 
CCGCCGTGCC 
GCTTACCTGC 
CCTAGCGACA 
GGCAGCCAGG 
TTTTTTTACC 
CTGGGCAGCC 
TGCATCTTCA 
GTGTGTTCAA 
CAATTTAATA 
AATACCCACT 
GCGTCCAGGA 
GGATCTTTAT 
TTCCGTTGGA 
ATTTGGCTCA 
TCATAATCAA 
GCTGTCTTTG 
TGGAAACATA 
AAGTCATATC 
GTCTCATCTC 



51 
I 

AGCCAGGACG 
AACTAATGGT 
CAGACTTTTT 
GAATGTACAT 
TGGCTCTTCG 
CTCTTTTCTT 
GCCGGGCCCT 
GAGCCGGGAG 
ACCGCTTGCT 
CTCGCCCGCG 
CGGCGGGCGC 
GCTGCATTTG 
TGGGTGTTTT 
AATGCAGCAT 
GAGGATTTCA 
AGCAAAGGCT 
GAAAATGAAA 
GCCGAAGCTA 
TATCTTGTTG 
AACGATTTAT 
TACGTTGATA 
TGCAGTGACT 
ACAGAGAACA 
GATACACCAG 
GGATGGCGAA 
GCTCTTGATA 



60 
120 
180 
240 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 



432 



10 



15 



20 



25 



30 



35 



40 



45 



50 



WO 02/086443 

GCAAATTGGC AGGCATAGTG 
ACGTCAAATC GACAACCATG 
ACAACAACAT TAATGT CATC 
TTCTACCCCT CTTGCCAGGC 
ATAATTTGGT AGTGGAAGCC 
ACCAGGTACA AGGCATCTAT 
CAGGCATGGA AGGATGCAGA 
TTACAATGAA AAAATGTGAT 
GTTTTAATGA AACCGCTAAA 
ACAGAGGACC TAAAGGAAAG 
GTGATGAGAA TAAATGTCAT 
ACAAGGATCA GCCTGTTTGC 
ACAAAATTAA GCTTGGAAAA 
CATATCACCA TGGAAATCTG 
GCTTCAGTGG CTGGGAAGGT 
TCAATTCAAA GGGCCAAGTG 
GCACCGATCC CAGGAGCATC 
GCAAGGAAAA CTGGAATTGT 
TTGATCAGTG CAAAACCTCA 
CAGAATGTTT CTCCAGCCCA 
TCTTGATTGG GTTGCTTAAA 
ATAAAATTAA GTCCTCATCA 
TGCAAAGTGT TTGCACAAGA 
TGGATATCAG CAAATTAAAT 
TTAAACACTT AATGGGAAAC 
AAGT CACAGG AGGAGACAAA 
GAAGACTGAC AAGTATCCTC 
AAAATGTGTC TTACTACTGT 
ACTTATTTAG AT C AG CAT AG 
TACCTGTTAT CCCTACGCTT 
CACTACAAGG GTACAGTAAT 
TATATTCTAA GGTTGCCAAA 
ATGAATAAAT GATTCGTGTT 
AAAGATTATT GCTTTTTAAA 
TTTGCAAGAT GGATACTAAT 
TTTTTACAGG ATAAGTTTAT 
TACTGCCATA AAAAACTAAT 
GAATGTTAA 
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GTGCCCAATG 
GAACACCCCT 
TTTGCAGTTC 
ACCATTGCTG 
TATCAGAAGC 
TTTAACATTA 
AACGTGACGA 
GT CACAGG AG 
ATTCATATAC 
TGTGTAGATG 
TTTGATGAAG 
AGTGGTCGAG 
GTGTATGGAA 
TGTGCTGGGC 
GATCGATGCC 
TGCAGTGGAA 
GGCCGCTTCT 
ATGCAATGCC 
TGTGCTCTCA 
AGCTACTTGA 
GTCCTGATCA 
GATTACAGAG 
GCAGTCACCT 
GCTCATGAAA 
TGGAATTGTT 
TTGCTCACGG 
AT CATGATGT 
TTGAGACTAG 
AATGTAGATC 
CCCAGAGAGA 
CCCTGCACTG 
CACTTCAACA 
TCACTCTTTC 
GTGTGTAGTT 
TCCAGCATTC 
GTATGTCACA 
AATACAATGT 



ACGGAAACTG 
CACTAGGCCA 
AAGGAAAACA 
GTGAAATAGA 
TCATTTCAGA 
CCGCCATCTG 
GCAATGATGA 
GAAAAAACTA 
ACAGAAACTG 
AAACTTTTCT 
ATCAGTTTTC 
GAGTTTGTGT 
AATACTGTGA 
ATGGAGAGTG 
AGTGCCCTTC 
GAGGCACGTG 
GTGAACACTG 
TTCACCCTCA 
TGGAACAACA 
GAATATTTTT 
TTAGACAGGT 
TGTCAGCCTC 
ACCGACGTGA 
CTTTCAGGTG 
AATAATTGCT 
TCATGCCAGT 
GACTCACATA 
TGTCGTTGTA 
CTCTGAAGAG 
ACAATGCTGT 
GACATGTGAG 
GTTGGTGGTT 
AAGAGGTGAA 
TTATGCATGT 
TCTCCTCTTT 
GATGACTGGA 
CACTTTATCA 



TCATCTGAAA 
ACTTTCAGAG 
ATTTCATTGG 
ATCAAAGGCT 
AGTGAAAGTT 
TCCAGATGGG 
AGTTCTTTTC 
TGCAATAATC 
CAGCTGT CAG 
AGATTCCAAG 
TTCTGAGAGT 
TTGTGGGAAA 
AAAGGATGAC 
TGAAGCAGGC 
AGCAGCAGCC 
TGTGTGTGGA 
CCCCACCTGT 
CAATTTGTCT 
GCATTATGTC 
CATCATTTTC 
GATACTACAA 
AAAAAAGGAT 
GAAGCCTGAA 
CAACTTCTAA 
CCTAAAGATT 
TGCTGGTTGT 
GCTGCTGACT 
GCACTTTACT 
CACTGATTAC 
GAGAGAGTTT 
GAAAAAAATA 
GAATAGACAA 
CAGATACAAC 
GTGTTTATGG 
GCCTTTATGT 
TTAATTAAGT 
GAATACTAGT 



AACAACGTCT 
AAATTAATAG 
TATAAGGATC 
GCAAACCTCA 
CAGGTGGAAA 
TCCAGAAAGC 
AATGTAACAG 
AAACCTATTG 
TGTGAGGACA 
TGTTTCCAGT 
TGCAAGTCAC 
TGTTCATGTC 
TTTTCTTGTC 
AGATGCCAAT 
CAGCACTGTG 
AGGTGTGAGT 
TATACAGCCT 
CAGGCTATAC 
GACCAAACTT 
ATAGTTACAT 
TGGAATAGTA 
AAGTTGATTC 
GAAATAAAAA 
AAAAAGATTT 
ATAATTTTAA 
ACACTCGAAC 
TTTT CAGAGA 
GTAATATATA 
ACTTTACAGG 
AGCATTGTGT 
ATCTGGCAAG 
GAACAGCTAG 
CTTAATCTTA 
TTTGCTTATT 
TTTGTTTTCT 
GCTAAGTTAC 
TTTAAAAGCT 



Seq ID NO: 645 Protein, sequence 
Protein Accession #: NP_002205 



55 



MCGSALAFFT 
LGPECGWCVQ 
GEVSIQLRPG 
SRDFRLGFGS 
VHRQKISGNI 
VPNDGNCHIjK 
TIAGEIESKA 
NVTSNDEVLF 
CVDETFLDSK 
VYGKYCEKDD 
CSGRGTCVCG 
CALMEQQHYV 
DYRVSASKKD 



11 
I 

AAFVCLQNDR 
EDFISGGSRS 
AEANFMLKVH 
YVDKTVSPYI 
DTPEGGFDAM 
NNVYVKSTTM 
ANLNNLWEA 
NVTVTMKKCD 
CFQCDENKCH 
FSCPYHHGNL 
RCECTDPRSI 
DQTSECFSSP 
KLILQSVCTR 



21 

i 

RGPASFLWAA 
ERCDIVSNLI 
PLKKYPVDLY 
SIHPERIHNQ 
LQAAVCESHI 
EHPSLGQLSE 
YQKLISEVKV 
VTGGKNYAI I 
FDEDQFSSES 
CAGHGECEAG 
GRFCEHCPTC 
SYLRIFFIIF 
AVTYRREKPE 



31 
I 

WVFSLVLGLG 
SKGCSVDSIE 
YLVDVSASMH 
CSDYNLDCMP 
GWRKEAKRLL 
KLIDNNINVI 
QVENQVQGIY 
KPIGFNETAK 
CKSHKDQPVC 
RCQCFSGWEG 
YTACKENWNC 
IVTFLIGLLK 
EIKMDISKLN 



41 

I 

QGEDNRCASS 
YPSVHVIIPT 
NNIEKLNSVG 
PHGYIHVLSL 
LVMTDQTSHL 
FAVQGKQFHW 
FNITAICPDG 
IHIHRNCSCQ 
SGRGVCVCGK 
DRCQCPSAAA 
MQCLHPHNLS 
VLIIRQVILQ 
AHETFRCNF 



51 
I 

NAASCARCLA 
ENEINTQVTP 
NDLSRKMAFF 
TENITEFEKA 
ALDSKLAGIV 
YKDLLPLLPG 
SRKPGMEGCR 
CEDNRGPKGK 
CSCHKIKLGK 
QHCVNSKGQV 
QAILDQCKTS 
WNSNKIKSSS 



1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 



Seq ID NO: 646 DNA sequence 
60 Nucleic Acid Accession #: NM_0 03 318.1 
Coding sequence 1..2574 



65 



70 



75 



80 



85 



ATGGAATCCG 
AGAGACATTA 
ATTTCTGCTG 
AACCCAGAGG 
GATGCTCTTT 
GATAAATATG 
GCTATTCAAG 
AAATTTGCTT 
AAAAGTAAAC 
GAAATTGCCC 
AAGAATTTAT 
CATTTACAGA 
TTATATGGAG 
CAAACTAACA 
AGCCCAGATT 
ACCTCTAGAT 
TCCTGTGAAT 
T CAG ATG AAA 
GAATCAAGTC 
GAGAGTAACC 
GCTGCATCTT 
AAACATACCA 
ACATCTAAAT 



11 
I 

AGGATTTAAG 
AAAATAAGTT 
ATACTACAGA 
ACTGGTTGAG 
TAAATAAATT 
GCCAAAATGA 
AGCCAGATGA 
TTGTTCATAT 
AACTTCTTCA 
TGCGGAATTT 
CAGCATCTAC 
ATAGGAACAA 
AGAACATGCC 
AAACTAAACA 
GTGATGTGAA 
CAGAATGCCG 
TAAGAAATTT 
AGAGTT CTG A 
TTCTAGCTAA 
AGAAACAGTG 
CAAATCACTG 
CTTTTGAGCA 
GGTTTGACCC 



21 
I 

TGGCAGAGAA 
TAAAAATGAA 
TAACTCGGGA 
TTTGTTGCTC 
GATTGGTCGT 
GAGTTTTGCT 
TGCACGTGAC 
ATCTTTTGCA 
AAAAGCTGTA 
AAACCTCCAA 
GGTATTAACT 
CAGTTGTGAT 
ACCACAAGAT 
GTCATGCCCA 
GACAGATGAT 
AGATTTGGTT 
AAAGTCTGTT 
ACTTATTATT 
ATTAGAAGAA 
GCAATCTAAG 
GCAGATTCCG 
ACCTGTCTTT 
AAAATCTATT 



31 
I 

TTGACAATTG 
GACCTTACTG 
ACTGTTAACC 
AAACTAGAGA 
TACAGTCAAG 
AGAATTCAAG 
TACTTTCAAA 
CAATTTGAAC 
GAACGTGGAG 
AAAAAGCAGC 
G CCCAAGAAT 
TCCAGAGGAC 
GCAGAAATAG 
TTTGGAAGAG 
TCAGTTGTAC 
GTGCCTGGAT 
CAAAATAGTC 
ACTGATTCAA 
ACTAAAGAGT 
AGAAAGTCAG 
GAGTTAGCCC 
TCAGTTTCAA 
TGTAAGACAC 



41 



51 



ATTCCATAAT 
ATGAACTAAG 
AAATTATGAT 
AAAACAGTGT 
CAATTGAAGC 
TGAGATTTGC 
TGGCCAGAGC 
TGTCACAAGG 
CAGTACCACT 
TGCTTTCAGA 
CATTTTCCGG 
AGACTACTAA 
GTTACCGGAA 
TCCCAGTTAA 
CTTGTTTTAT 
CTAAACCAAG 
ATTTCAAGGA 
TAACCCTGAA 
ATCAAGAACC 
AGTGTATTAA 
GAAAAGTTAA 
AACAGTCACC 
CAAGCAGCAA 



GAACAAAGTG 60 

CTTGAATAAA 120 

GATGGCAAAC 180 

TCCGCTAAGT 240 

GCTTCCCCCA 300 

TGAATTAAAA 360 

AAACTGCAAG 420 

TAATGTCAAA 480 

AGAAATGCTG 540 

GGAGGAAAAG 600 

TTCACTTGGG 660 

AGCCAGGTTT 720 

TTCATTGAGA 780 

CCTTCTAAAT 840 

GAAAAGACAA 900 

TGGAAATGAT 960 

ACCTCTGGTG 1020 

G AATAAAACG 1080 

AGAGGTTCCA 1140 

CCAGAATCCT 12 00 

TACAGAGCAG 1260 

ACCAATATCA 132 0 

TACCTTGGAT 1380 



433 



10 



15 



20 



WO 02/086443 

GATTACATGA GCTGTTTTAG 
TTGTCAACAC CTTATGGCCA 
ACTCCACTTC AAAATTTACA 
AAAGGAAGAA TTTATTCCAT 
CAGGTGTTAA ATGAAAAGAA 
GATAACCAAA CTCTTGATAG 
CACAGTGATA AGATCATCCG 
GTAATGGAGT GTGGAAATAT 
CCATGGGAAC GCAAGAGTTA 
CATGGCATTG TTCACAGTGA 
AAGCTAATTG ATTTTGGGAT 
GATTCTCAGG TTGGCACAGT 
TCCAGAGAGA ATGGGAAATC 
GGATGTATTT TGTACTATAT 
ATTTCTAAAT TACATGCCAT 
GAG AAAGAT C TTCAAGATGT 
TCCATTCCTG AGCTCCTGGC 
ATGGCCAAGG GAACCACTGA 
TCTCCTAACT CCATTTTGAA 
AGTCATAATT CTTCATCCTC 



PCT/US02/12476 



AACTCCAGTT 
ACCTGCCTGT 
GGTTTTAGCA 
TTTAAAGCAG 
ACAGATATAT 
TTACCGGAAC 
ACTTTATGAT 
TGATCTTAAT 
CTGGAAAAAT 
TCTTAAACCA 
TGCAAACCAA 
TAATTATATG 
TAAGTCAAAG 
GACTTACGGG 
AATTG AT CCT 
GTTAAAGTGT 
TCATCCCTAT 
AGAAATGAAA 
AGCTGCTAAA 
CAAGACTTTT 



GTAAAGAATG 
TTCCAGCAGC 
TCTTCTTCAG 
ATAGGAAGTG 
GCTATAAAAT 
GAAATAGCTT 
TATGAAATCA 
AGTTGGCTTA 
ATGTTAGAGG 
GCTAACTTTC 
ATGCAACCAG 
CCACCAGAAG 
ATAAGCCCCA 
AAAACACCAT 
AAT CATGAAA 
TGTTTAAAAA 
GTTCAAATTC 
TATGTTCTGG 
ACTTTATATG 
GAAAAAAAAA 



ACTTTCCACC 
AACAGCATCA 
CAAATGAATG 
GAGGTT CAAG 
ATGTGAACTT 
ATTTGAATAA 
CGGACCAGTA 
AAAAGAAAAA 
CAGTTCACAC 
TGATAGTTGA 
ATACAACAAG 
CAATCAAAGA 
AAAGTGATGT 
TT CAGCAGAT 
TTGAATTTCC 
GGGACCCAAA 
AAACTCATCC 
GCCAACTTGT 
AACACTATAG 
GGGGAAAAAA 



TGCTTGTCAG 1440 

AATACTTGCC IS 00 

CATTTCGGTT 1560 

CAAGGTATTT 1620 

AGAAGAAGCA 1680 

ACTACAACAA 1740 

CATCTACATG 1800 

ATCCATTGAT 1860 

AATCCATCAA 192 0 

TGGAATGCTA 1980 

TGTTGTTAAA 2040 

TATGTCTTCC 2100 

TTGGTCCTTA 2160 

AAT T AAT CAG 222 0 

CGATATTCCA 22 8 0 

ACAGAGGATA 2340 

AGTTAACCAA 2400 

TGGT CTGAAT 2460 

TGGTGGTGAA 2520 
ATGA 



Seq ID NO: 64 7 Protein sequence 
Protein Accession #: NP 003309.1 



25 



30 



35 



40 



1 

MESEDLSGRE 
NPEDWLSLIiL 
AIQEPDDARD 
EIALRNIiNLQ 
LYGENMPPQD 
TSRSECRDLV 
ESSLLAKLEE 
KHTTFEQPVF 
LSTPYGQPAC 
QVLNEKKQIY 
VMECGNIDLN 
KLIDFGIANQ 
GCILYYMTYG 
SIPEIiLAHPY 
SHNSSSSKTF 



11 
I 

LTIDSIMNKV 
KLEKNSVPLS 
YFQMARANCK 
KKQLLSEEEK 
AEIGYRNSLR 
VPGSKPSGND 
TKEYQEPEVP 
SVSKQSPPIS 
FQQQQHQILA 
A I K YVNLEEA 
SWLKKKKSID 
MQPDTTSWK 
KTPFQQIINQ 
VQIQTHPVNQ 
EKKRGKK 



21 
I 

RDIKNKFKNE 
DALLNKLIGR 
KFAFVHISFA 
KNLSASTVLT 
QTNKTKQSCP 
SCELRNLKSV 
ESNQKQWQSK 
TSKWFDPKSI 
TPLQNLQVLA 
DNQTIiDSYRN 
PWERKSYWKN 
DSQVGTVNYM 
ISKLHAIIDP 
MAKGTTEEMK 



31 
I 

DLTDELSLNK 
YSQAIEALPP 
QFELSQGNVK 
AQESFSGSLG 
FGRVPVNLLN 
QNSHFKEPLV 
RKSECINQNP 
CKTPSSNTLD 
SSSANECISV 
EIAYLNKLQQ 
MIiEAVHTIHQ 
PPEAIKDMSS 
NHEIEFPDIP 
YVLGQLVGLN 



41 
I 

ISADTTDNSG 
DKYGQNESFA 
KSKQLLQKAV 
HLQNRNNSCD 
SPDCDVKTDD 
SDEKSSELII 
AASSNHWQIP 
DYMSCFRTPV 
KGRIYSILKQ 
HSDKIIRLYD 
HGIVHSDLKP 
SRENGKSKSK 
EKDLQDVLKC 
SPNSILKAAK 



51 

I 

TVNQIMMMAN 60 

RIQVRFAELK 120 

ERGAVPLEML 180 

SRGQTTKARF 240 

SWPCFMKRQ 300 

TDSITLKNKT 360 

EDARKVNTEQ 42 0 

VKNDFPPACQ 480 

IGSGGSSKVF 540 

YEITDQYIYM 600 

ANFLIVDGML 660 

ISPKSDVWSL 720 

CLKRDPKQRI 780 

TLYEHYSGGE 840 



Seq ID NO: 648 DNA sequence 
Nucleic Acid Accession #: NM_015507 
45 Coding sequence: 241.. 1902 



50 



55 



60 



65 



70 



75 



80 



85 



CCGCAGAGGA 
CGCCCCTGCC 
CGAGTGGAGC 
GGGTCCGGCC 
ATGCCTCTGC 
GGGAACGCGG 
TGTCACTATG 
TGTGAAGCTA 
AGATGCTTTC 
AAACCCCGGC 
CTCAGTGGCC 
ATAAACTGTC 
TCAGGACTCC 
GGTAAAGTCA 
AAATGTCACA 
AATGAATGTA 
GGGTCCTTCA 
ATCCCTGAAA 
AAGAAGTTGC 
CCAGAACCCA 
ATAGTTTCCA 
GAGGGGCTTG 
AGCCTGCGAG 
CTGGTCCAAA 
GACTGCAGCT 
TGGAATCCTG 
GGTCACAAGA 
AACTTCTGTT 
TTTGTGAAAA 
TGGAAGACAG 
GAAGCAGAAC 
TCAGGCTTAT 
TTGACTTTGT 
TTAGAATTAC 
TCTTGTATAA 
TTTCTGAATC 
CAGT AT AT CT 
TAGAAAAAAA 
TATGACATCA 



11 
I 

GCCTCGGCCA 
GCGGTGCCTG 
GGAGGACCCG 
GGCGCCCTCC 
CCTGGAGCCT 
CCAGTGCAAG 
GAACTAAACT 
CAT G CG AACC 
CAGGATACAC 
CATGCCAACA 
ACATGCTCAT 
AGTACAGCTG 
GCCTGGCCCC 
TCTGTCCCTA 
TTGGTTTCGA 
CTATGGATAG 
AGTGTAAATG 
ATTCTGTGAA 
TTGCTCACAA 
CCAGGACTCC 
GAGGCGGGAA 
AGGATGAGAA 
GAG ATGTGT T 
GGAAAGCGCT 
TCAATCATGG 
CTG AT CGAG A 
AAGACATTGG 
TGCTCTTTGA 
ACAGTAACAA 
GGAAAATTCA 
GTGGCAAGGG 
GT C CAG AT AG 
ATGTCAGTTC 
TAG C T G AAAA 
GATATGCCAA 
TTTCCACATT 
GATTTGTATA 
AG CACAG AG A 
AAGATAGACT 



21 

I 

GGCTAGCCAG 
GCCTCCCCTC 
AGCGGCTGAG 
CGAGGGGGGC 
TGCGCTCCCG 
G CAT C ACGGG 
GGCCTGCTGC 
TGGATGTAAG 
CGGGAAAACC 
CAGATGTGTG 
GCCAGATGCT 
TGAAGACACA 
AAATGGAAGA 
CAATCGAAGA 
ACTGCAATAT 
CCATACGTGC 
CAAGCAGGGA 
GGAAGTCCTC 
AAACAGCATG 
TACCCCTAAG 
CTCT CATGGA 
AAGAGAAGAG 
TTTCCCTAAG 
AACTTCCAAA 
GATCTGTGAC 
TAATGCTATT 
CCGATTGAAA 
TTACCGGCTG 
TGCCCTGGCA 
GTTGTATCAA 
CAAAACCGGC 
CCTTTTATCT 
CCTGGTTTTT 
ATTGTAATGT 
TATTTGCTTT 
AT AT TAT AAA 
AGTAAGTTGA 
AATGTTTAAC 
TTTGCCTAAG 



31 



GGCGCCCCCA 
CCAGACTGCA 
GAGAGAGGAG 
TCAGGAGGAG 
CTGCTGCTCT 
TTGTTAGCAT 
TACGGCTGGA 
TTTGGTGAGT 
TGCAGTCAAG 
AATACACACG 
ACGTGTGTGA 
GAAGAAGGGC 
GACTGT CT AG 
TGTGTGAACA 
ATCAGTGGAC 
AGCCACCATG 
TATAAAGGCA 
AGAGCACCTG 
AAAAAGAAGG 
GTGAACTTGC 
GGTAAAAAAG 
AAAGCCCTGA 
GTGAATGAAG 
CTGGAACATA 
TGGAAACAGG 
GGCTTCTATA 
CTTCTCCTAC 
GCCGGAGACA 
TGGGAGAAGA 
GGAACTGATG 
GAAAT CGCAG 
GTGGATGACT 
TTGATATTGC 
ACCAACAGAA 
AAATATCATA 
ATATGGAAAT 
TGAGCTTCTC 
TGTTTGACTC 
TGGCTTAGCT 



41 
i 

GCCCCTCCCC 
GGGACAGCAC 
GCGGCGGCTT 
GAAGGAGGAC 
CCTGGGTGGC 
CGGCACGTCA 
GAAGAAACAG 
GCGTGGGACC 
ATGTGAATGA 
GAAGCTACAA 
ACTCTAGGAC 
CACAGTGCCT 
ATATTGATGA 
CATTTGGAAG 
GATATGACTG 
CCAATTGCTT 
ATGGACTTCG 
GTACCATCAA 
CAAAAATTAA 
AGCCCTTCAA 
GGAATGAAGA 
AGAATGACAT 
CAGGTGAATT 
AAGATTTAAA 
ATAGAGAAGA 
TGGCAGTTCC 
CTGACCTGCA 
AAGTCGGGAA 
CCACGAGTGA 
CTACCAAAAG 
TGGATGGCGT 
GAATGTTACT 
ATCATAGGAC 
ATATTATTGT 
TCACTGTATC 
GTCAGTTTAT 
TCTACAACAT 
TTATGATACT 
GGGTCTTTCA 



51 



AGGCCGCGAG 60 

CCGGTAACTG 12 0 

AGCTGCTACG 180 

CCGTGCGAGA 240 

AGGTGGTTTC 300 

GCCTGGGGTC 3 60 

CAAGGGAGTC 42 0 

AAACAAATGC 480 

GTGTGGAATG 540 

GTGCTTTTGC 600 

ATGTGCCATG 660 

GTGTCCATCC 72 0 

ATGTGCCTCT 780 

CTACTACTGC 840 

TATAGATATA 900 

CAATACCCAA 960 

GTGTTCTGCT 1020 

AGACAGAATC 1080 

AAATGTTACC 1140 

CTATGAAGAG 1200 

GAAAATGAAA 1260 

AGAGGAGCGA 132 0 

CGGCCTGATT 1380 

TATCTCGGTT 1440 

TGATTTTGAC 150 0 

GGCCTTGGCA 1560 

ACCCCAAAGC 1620 

ACTTCGAGTG 1680 

GGATGAAAAG 1740 

CATCATTTTT 1800 

CTTGCTTGTT 1860 

AT CTTT ATAT 192 0 

CTCTGGCATT 1980 

AAGATGCCTT 2040 

TTCTCAGTCA 2100 

CTCCCCTCCT 2160 

TTCTAGAAAA 2220 

TCTTGGAAAC 2280 

TAGCCAAACT 2340 



434 



WO 02/086443 

TGTATATTTA AATTCTTTGT AATAATAATA TCCAAATCAT CAAAAAAAAA AAAAAAAA 



PCT/US02/12476 



Seq ID NO: 64 9 Protein sequence 
Protein Accession #: NP_056322 



10 



15 



20 
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30 



35 
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50 



55 



60 
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70 



75 



i 
I 

MPLPWSLALP 
CEATCEPGCK 
LSGHMLMPDA 
GKVICPYNRR 
GSFKCKCKQG 
PEPTRTPTPK 
SLRGDVPFPK 
WNPADRDNAI 
FVKNSNNALA 
SGLCPDSLLS 



11 

I 

LLLSWVAGGF 
FGECVGPNKC 
TCVNSRTCAM 
CVNTFGSYYC 
YKGNGLRCSA 
VNLQPFNYEE 
VNEAGEFGLI 
GFYMAVPALA 
WEKTTSEDEK 
VDD 



21 

1 

GNAASARHHG 
RCFPGYTGKT 
INCQYSCEDT 
KCHIGFELQY 
IPENSVKEVL 
I VSRGGNSHG 
LVQRKALTSK 
GHKKDIGRLK 
WKTGKIQLYQ 



31 
I 

LLASARQPGV 
CSQDVNECGM 
EEGPQCLCPS 
ISGRYDCIDI 
RAPGTIKDRI 
GKKGNEEKMK 
LEHKDLNISV 
LLLPDLQPQS 
GTDATKSIIF 



41 
I 

CHYGTKLACC 
KPRPCQHRCV 
SGLRLAPNGR 
NECTMD SHTC 
KKLLAHKNSM 
EGLEDEKREE 
DCSFNHGI CD 
NFCLLFDYRL 
EAERGKGKTG 



51 
I 

YGWRRNSKGV 
NTHGSYKCFC 
DCLDIDECAS 
SHHANCFNTQ 
KKKAKIKNVT 
KALKNDIEER 
WKQDREDDFD 
AGDKVGKLRV 
EIAVDGVIiLV 



Seq ID NO: 650 DNA sequence 

Nucleic Acid Accession #: iJM_003 506.1 

Coding sequence: 259.-2379 



80 



GCAGCTCCAG 
TTAGACGGGG 
CTCATTTTCA 
ATCTTTGGAT 
ATCAGGAATT 
CTCCTAAGAG 
ATGGCCTACA 
GCGGTGGAAA 
ACTTTCCTCT 
TGTCGTAAAC 
ATCCGATGGC 
GTAACTTTTG 
AGAGACATTG 
TTTCTGGGAA 
CTAGAGTTTG 
TTCACATTCC 
ATATATTACT 
GGCGATAGCA 
CTAGGCTCTC 
GCTGGCACTG 
TGGAGTTGTG 
CCAGGTTTCC 
GGAGTTTGCT 
CTGTGCCTTT 
CATGTTCGAC 
ATTCGAATTG 
TACGTCTATG 
CGTCAGTACC 
TTATTTATGA 
GGAAGCAAAA 
CCAATCAGTG 
TCTAAAGTTA 
TCCAAATCCA 
ATTACTAGCC 
ACAT CAATGA 
TGTGGTGAAC 
GGGAAGGGCC 
AAGAGTGATA 
TCAGAACCAA 
AGAAAAGAGC 
CAGAAGCAAA 
TACGTTCTTC 
TCAAGAATAA 
AAATGTGCAG 
CCTTTTCTAT 
TTTACCTTTT 
GTATCTTTTT 
ATTCAAGTAT 
ATTTCTAAGA 
GTCTTATAAT 
TGTGATTTTT 
GGTGCTTACT 
ATATTTAAAA 
GGCCAAGTGC 
AACCACTTAC 
TACATTTTGT 



11 
I 

TCCCGGACGC 
ACGGGAAGGG 
GGAAAGCCTG 
GGGGATCTTC 
TGAAGAAAAT 
GGCACAGTCT 
ACATGACGTT 
TGGAGCATTT 
GCAAAGCATT 
TTTGTGAGAA 
CTGAGGAGCT 
ATCCACACAC 
GATTTTGGTG 
TTGACCAGTG 
CAAAAAGTTT 
TTACTTTTTT 
CTGTCTGTTA 
CAGCCTGCAA 
AAAATAAGGC 
TGTGGTGGGT 
AAGCCATCGA 
TGACTGTTAT 
TTGTTGGCCT 
GTGTGTTTGT 
AAGT CAT AC A 
GAGTCTTCAG 
AGCAAGTGAA 
ATATCCCATG 
TAAAATACCT 
AGACATGCAC 
AAA GT CGAAG 
AACACAAAAA 
TGGGAACCAG 
ATGATTACCT 
GAGAGGTGAA 
CTGCCTCGCC 
AGGCAGGCAG 
TTACTGACAC 
GCAGCCTCAA 
AGGGAGGTGG 
TTTGTGTTAC 
TTTTGCACTT 
TATGACTCAT 
GTTAATAATA 
TTATGAAGAT 
TGATATAAAA 
ATACATATTT 
TTTTATCATG 
AAATTGTAAA 
AGGAATTTAA 
ATAGTCTCGT 
CAAAGAGTGT 
TAAAATGTCC 
AATTGACTTC 
AGTTGCTTAT 
ATTATACAGT 



21 

1 

AACCCCGGAG 
ACAGCGGCCT 
AAAATGAGTA 
TGAGGATGCA 
GGAGATGTTT 
CTTCACCTGT 
TTTCCCTAAT 
TCTTCCTCTC 
TGTACCAACC 
AGTATATTCT 
TGAATGTGAC 
AGAATTTCTT 
TCCAAGGCAT 
TGCGCCTCCA 
TATTGGAACA 
AATTGATGTT 
CAGCATTGTA 
TAAGGCAGAT 
TTGCACCGTT 
GATTCTTACC 
G CAAAAAGC A 
GCTTCTTGCT 
TTATGACCTG 
TGGGCTCTCT 
ACATGATGGC 
CGGCTTGTAT 
CAGGATTACC 
TCCTTATCAG 
GATGACATTA 
AGAATGGGCT 
AGTACTACAG 
GAAGCACTAT 
CACAGG AG CT 
AGGACAAGAA 
AGCGGACGGA 
AGCAGCATCC 
TGTATCTGAA 
TGGCCTGGCA 
AGGTT CCACA 
TTGT CATTCA 
ACTGGAAGTG 
AAAGTTGCAT 
TTCACACAAA 
TTTTTTTAAT 
TCTACTCTTG 
TCAAGATATT 
GAAAATAAGC 
CTATTGTGAT 
ATAGTCTTCT 
CTTTAAAAAC 
TTTAGGAATT 
CCACTATTGA 
TAAAGGGTTA 
CCTTTTTTAA 
ATTTTTTGTT 
ACCTTTCTCA 



31 
I 

CCGTCTCAGG 
TCGACCGCCC 
AAATAGTGAA 
AAGAGTGATT 
ACATTTTTGT 
GAACCAATTA 
CTGATGGGTC 
GCAAATCTGG 
TGCATAGAAC 
GATTGCAAAA 
AGATTACAAT 
GGTCCTCAGA 
CTTAAGACTT 
TGCCCCAACA 
GTTTCAATAT 
AGAAGATTCA 
TCTCTTATGT 
GAGAAGCTAG 
TTGTTCATGC 
ATTACTTGGT 
GTGTGGTTTC 
CTGAACAAAG 
GATGCTTCTC 
CTTCTTTTAG 
CGGAACCAAG 
CTTGTGCCAT 
TGGGAGATAA 
GCAAAAGCAA 
ATTGTTGGCA 
GGGTTTTTTA 
GAATCATGTG 
AAACCAAGTT 
AC AGCAAAT C 
ACTTTGACAG 
GCTAGCACCC 
AT CT CCAGAC 
AGTGCGCGGA 
CAGAGCAACA 
TCTCTGCTTG 
GATACTTGAA 
ACCTATGCAC 
TGCCTACTGT 
GGTTAATGAC 
AGTGTGGGAG 
GTAAGAGTAT 
TCTTTGCTGA 
TTATATGTAT 
ATTTTAGCAC 
TTTATACTGT 
CCACTTATTG 
TCACAGATCT 
TTGTATTATG 
GTAGACAAAA 
TGTTTCATGA 
TTAACTTTTG 
GACATTTTGT 



41 

1 

TCCCTGGGGG 
CCCGAGTAAT 
ATGAGGAATT 
CATCCAAGCC 
TGACGTGTAT 
CTGTTCCCAG 
ATTATGACCA 
AATGTTCACC 
AAATT CATGT 
AATTAATTGA 
ACTGTGATGA 
AGAAAACAGA 
CTGGGGGACA 
TGTATTTTAA 
TTTGTCTTTG 
GATACCCAGA 
ACTTCATTGG 
AACTTGGTGA 
TTTTGTATTT 
TCTTAGCTGC 
ATGCTGTTGC 
TTGAAGGAGA 
GCTACTTTGT 
CTGGCATTAT 
AAAAACTAAA 
TAGTGACACT 
CTTGGGTCTC 
AAGCTCGACC 
TCTCTGCTGT 
AACGAAATCG 
AGTTTTTCTT 
CACACAAGCT 
ATGGCACTTC 
AAATCCAAA C 
CCAGGTTAAG 
TCTCTGGGGA 
G TGAAGGAAG 
ATTTGCAGGT 
TTCACCCAGT 
GAACATTTTC 
TGTTTTGTAA 
TATACTGGAA 
AACAATATAC 
GACAGAGTTA 
TTTAAGATGT 
AGTATTTAAA 
TTGAACTTTT 
TTTGGTAGCT 
AAAAAAAGAT 
ATACCTTACC 
AAATTATGTA 
CTGCTCACTG 
TGTTAGTCTT 
CCACCCATTG 
TTTCTTAACA 
AG 



51 
I 

GAACGGTGGG 
TGACCCAGGA 
TGAACATTTT 
ATGTGGTAAA 
TTTTCTACCC 
ATGTATGAAA 
GAGTATTGCC 
AAACATTGAA 
GGTTCCACCT 
CACTTTTGGG 
GACTGTTCCT 
ACAAGTCCAA 
AGGATATAAG 
AAGTGATGAG 
TGCAACTCTG 
GAGACCAATT 
ATTTTTGCTG 
CACTGTTGTC 
TTTCACAATG 
AGGAAGAAAA 
ATGGGGAACA 
CAACATTAGT 
ACTCTTGCCA 
TTCCTTAAAT 
GAAATTTATG 
TCTCGGATGT 
TGATCATTGT 
AGAATTGGCT 
CTTCTGGGTT 
CAAGAGAGAT 
AAAGCACAAT 
GAAGGTCATT 
TGCAGTAGCA 
CTCACCAGAA 
AGAACAGGAC 
ACAGGT CG AC 
GATTAGTCCA 
CCCCAGTTCT 
TTCAGGAGTG 
TCTCGTTACT 
GAATCACTGT 
AAAATAGAGT 
CTGAAAACAG 
GAGGAATCTT 
ACTATGCTAT 
TCTTATCCTT 
TTGAAATCCT 
TTTACACTGA 
ATACCAAAAA 
AT CT AAAATG 
ACTGAAATAA 
ATCCTTCTGC 
TTGTATATTA 
ATTGTATTAT 
TTTAGAATAT 



60 
120 
180 
240 
300 
360 
420 
480 
540 



60 
120 
18 0 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 



85 



Seq ID NO: 651 Protein sequence 
Protein Accession #: NP_003497.1 



11 



21 



31 



41 



51 



435 



10 



WO 02/086443 

MEMFTFLLTC IFXjPLLRGHS 
FLPLANLECS PNIETFLCKA 
LECDRLQYCD ETVPVTFDPH 
CAPPCPNMYF KSDELEFAKS 
YSIVSLMYFI GFLLGDSTAC 
VILTITWFLA AGRKWSCEAI 
LYDLDASRYF VLLPLCLCVF 
SGLYLVPLVT LLGCYVYEQV 
LMTLIVGISA VFWVGSKKTC 
KKHYKPSSHK LKVISKSMGT 
KADGASTPRL REQDCGEPAS 
TGLAQSNNLQ VPSSSEPSSL 



PCT/US02/12476 



LFTCEPITVP 
FVPTCIEQIH 
TEFLGPQKKT 
FIGTVSIFCL 
NKADEKLELG 
EQKAVWFHAV 
VGLSLIiLAGI 
NRITWEITWV 
TEWAGFFKRN 
STGATANHGT 
PAASISRLSG 
KGSTSLLVHP 



RCMKMAYNMT 
WPPCRKLCE 
EQVQRDIGPW 
CATLFTFLTF 
DTWLGSQNK 
AWGT PGFLTV 
ISLNHVRQVI 
SDHCRQYHIP 
RKRDPISESR 
SAVAITSHDY 
EQVDGKGQAG 
VSGVRKEQGG 



FFPNLMGHYD 
KVYSDCKKLI 
CPRHbKTSGG 
LIDVRRFRYP 
ACTVLFMLLY 
MLLALNKVEG 
QHDGRNQEKL 
CPYQAKAKAR 
RVLQESCEFF 
LGQETLTEIQ 
SVSESARSEG 
GCHSDT 



QSIAAVEMEH 60 

DTFGIRWPEE 120 

QGYKFLGIDQ 18 0 

ERPIIYYSVC 240 

FFTMAGTVWW 300 

DNISGVCFVG 360 

KKFMIR I GVF 42 0 

PELALFMIKY 480 

LKHNSKVKHK 540 

TSPETSMREV 600 

RISPKSDITD 660 



15 



Seq ID NO: 652 DNA sequence 

Nucleic Acid Accession #: NM_014791.1 

Coding sequence; 171.. 2 12 6 



20 



25 



30 



35 



40 



45 



50 



55 



60 



TTGGCGGGCG 
GCCGCGTCTC 
TCCGCCCCTC 
ATGATGAACT 
AGGT CAAACT 
AAAACACACT 
TGAGACATCA 
TGGTTCTTGA 
TGT CAGAAG A 
ACAGCCAGGG 
ATAAATTAAA 
ATCTACAGAC 
CATATCTTGG 
GTGGATTTCT 
GAAAATATGA 
TGCAGGTGGA 
TGCAAGATTA 
ATGATTGCGT 
TAATTTCACT 
AGGCTCGGGG 
CTACCCCATT 
ATAAAAATTA 
GTGCTGCTAC 
AATCTAAATC 
AAAATGTATA 
CAAAGACTCC 
ACACTACACC 
TAAATTCAAC 
GCTCAGTGGA 
CCAAAGTGTT 
GCAAAAGGAA 
CTACAACTAG 
AGAAGCATGT 
TTGGGAAAGT 
TGGGTAT C AG 
ACATCCTATC 
GGTGTGATAC 
CTACCAACTT 
GATATTATTT 
TAATCATGTG 
AATGTAAGCT 
TTGTGAATAT 



11 

I 

GAAGCGGCCA 
TCAGGACAGC 
AGGTTCTTTT 
TCTCAAATAT 
TGCCTGCCAT 
AGGGAGTGAT 
GCATATATGT 
GTACTGCCCT 
GGAGACCCGG 
CTATGCTCAC 
GCTGATTGAC 
ATGCTGTGGG 
ATCAGAGGCA 
ACCATTTGAT 
TGTTCCCAAG 
CCCAAAGAAA 
CAACTATCCT 
AACAGAACTT 
GTGGCAGTAT 
AAAACCAGTT 
CACAGACATC 
TGTGGCGGGA 
TCCCCGAACA 
ATTAACTCCA 
TACTCCTAAG 
AGTTAATAAG 
CTCAAAAGCT 
AGGAACAGAC 
ATTGGATCTC 
TGGGAGCCTT 
GGGTTCTGCC 
ATTAGTGAAT 
TGACTTTGTA 
GACAATGCAA 
GAGGCAGCGG 
TAGCTGCAAG 
AGCCTACATA 
GTTT CTAAAG 
TGTGTATGAA 
GTTTTGTATA 
CTTAACTATG 



21 
I 

CAACCCGGCG 
AGGCCCCTGT 
TCTAATTCCA 
TATGAATTAC 
AT CCTT ACTG 
TTGCCCCGGA 
CAACTCTACC 
GGAGGAGAGC 
GTTGTCTTCC 
AGGGACCTCA 
TTTGGTCTCT 
AGTCTGGCTT 
GATGTTTGGA 
GATGATAATG 
TGGCTCTCTC 
CGGATTTCTA 
GTTGAGTGGC 
TCTGTACATC 
GATCACCTCA 
CGTTTAAGGC 
AAGTCAAATA 
TTAATAGACT 
TCACAGTTTA 
GCCTTATGCA 
TCTGCTGTAA 
AACCAGCATA 
AGAAACCAGT 
AAGTTAATGA 
AACCAAGCAC 
GAAAGGGGGT 
AGAGACGGGC 
CCAGATCAAC 
CAAAAGGGTT 
TTTGAATTAG 
CTTAAGGGCG 
GTATAATTGA 
AAG AC TGT T A 
AG C TAT CT T A 
TCTAAATCAA 
TTAATAATTG 
TCTCTTTGTA 



31 
I 

ATCGAAAAGA 
CCTTCTGTCG 
AATAAACTTG 
ATGAAACTAT 
GAGAGATGGT 
TCAAAACGGA 
ATGTGCTAGA 
TGTTTGACTA 
GTCAGATAGT 
AGCCAGAAAA 
GTGCAAAACC 
ATGCAGCACC 
GCATGGGCAT 
TAATGGCTTT 
CCAGTAGCAT 
TGAAAAATCT 
AAAGCAAGAA 
ACAGAAACAA 
CGGCTACCTA 
TTTCTTCTTT 
ATTGGAGTCT 
ATGATTGGTG 
CCAAGTACTG 
GAACACCTGC 
AGAATGAAGA 
AGAGAGAAAT 
GCCTGAAAGA 
CAGGTGTCAT 
ATATGGAGGA 
TGGATAAGGT 
CCAGAAGACT 
TGTTGAATGA 
ATACACTGAA 
AAGTGTGCCA 
ATGCCTGGGT 
TGGATTCTTC 
TGATCGCTTT 
AGACCAATAT 
GCCCATCTGT 
TTGACTTTCT 
ATGTGTAATT 



41 
I 

TTCTTAGGAA 
GGCGCCGCTC 
CAAGAGGACT 
TGGGACAGGT 
AGCTATAAAA 
GATTGAGGCC 
GACAGCCAAC 
TATAATTTCC 
ATCTGCTGTT 
TTTGCTGTTT 
CAAGGGTAAC 
TGAGTTAATA 
ACTGTTATAT 
ATACAAGAAG 
TCTGCTTCTT 
ATTGAACCAT 
TCCTTTTATT 
CAGGCAAACA 
TCTTCTGCTT 
CTCCTGTGGA 
GGAAGATGTG 
TGAAGATGAT 
GACAGAATCA 
AAATAAATTA 
GTACTTTATG 
ACTCACTACG 
AACTCCAATT 
TAGCCCTGAG 
GACTCCAAAA 
TATCACTGTG 
AAAGCTTCAC 
AATAATGTCT 
GTGTCAAACA 
GCTTCAAAAA 
TTACAAAAGA 
CATCCTGCCG 
GATTTTAAAG 
CTCTTTGTTT 
CATTATGTTA 
TAGATTCACT 
TCTTTCTGAA 



51 



CGCCGTACCA 60 

AGCCGTGCCC 12 0 

ATGAAAGATT 180 

GGCTTTGCAA 240 

ATCATGGATA 300 

TTGAAGAACC 3 60 

AAAATATTCA 42 0 

CAGGATCGCC 480 

GCTTATGTGC 540 

GATGAATATC 60 0 

AAGGATTACC 660 

CAAGGCAAAT 720 

GTTCTTATGT 780 

ATTATGAGAG 840 

CAACAAATGC 900 

CCCTGGATCA 960 

CACCTCGATG 1020 

ATGGAGGATT 1080 

CTAGCCAAGA 1140 

CAAGCCAGTG 12 00 

ACCGCAAGTG 12 60 

T T ATCAAC AG 1320 

AATGGGGTGG 1380 

AAGAAC AAAG 1440 

TTTCCTGAGC 1500 

CCAAATCGTT 1560 

AAAAT ACCAG 1620 

AGGCGGTGCC 1680 

AGAAAGGGAG 174 0 

CTCACCAGGA 1800 

TATAATGTGA 1860 

ATTCTTCCAA 192 0 

CAGTCAGATT 1980 

CCCGATGTGG 2040 

TTAGTGGAAG 2100 

GATGAGTGTG 2160 

TTCAT TGGAA 2220 

TTAAACAAAA 2280 

CTGTCTTTTT 2340 

TCCATATGTG 2400 

ATAAAACCAT 2460 



65 



70 



75 



80 



85 



Seq ID NO: 653 Protein sequence 
Protein Accession #: NP_055606.1 



I 

MKDYDELLKY 
IiKNLRHQHIC 
AYVHSQGYAH 
QGKSYLGSEA 
QQMLQVDPKK 
MEDLISLWQY 
TASDKNYVAG 
KNKENVYTPK 
KIPVNSTGTD 
LTRSKRKGSA 
QSDFGKVTMQ 



11 
I 

YELHETIGTG 
QLYHVLETAN 
RDLKPENLLF 
DVWSMGILLY 
RISMKNLLNH 
DHLTATYLLL 
LIDYDWCEDD 
SAVKNEEYFM 
KLMTGVISPE 
RDGPRRLKLH 
FELEVCQLQK 



21 



GFAKVKLACH 
KIFMVLEYCP 
DEYHKLKLID 
VLMCGFLPFD 
PWIMQDYNYP 
LAKKARGKPV 
LSTGAATPRT 
FPEPKTPVNK 
RRCRSVELDL, 
YNVTTTRLVN 
PDWGIRRQR 



31 
I 

ILTGEMVAIK 
GGELFDYIIS 
FGLCAKPKGN 
DDNVMALYKK 
VEWQSKNPFI 
RLRLSSFSCG 
SQFTKYWTES 
NQHKREILTT 
NQAHMEETPK 
PDQLIiNEIMS 
LKGDAWVYKR 



41 



IMDKNTLGSD 
QDRLSEEETR 
KDYHLQTCCG 
IMRGKYDVPK 
HLDDDCVTEL 
QASATPFTDI 
NGVESKSLTP 
PNRYTTPSKA 
RKGAKVFGSL 
I LPKKHVDF V 
LVEDILSSCK 



51 
I 

LPRIKTEIEA 
WFRQIVSAV 
SLAYAAPELI 
WLSPSSILLL 
SVHHRNNRQT 
KSNNWSLEDV 
ALCRTPANKL 
RNQCLKETPI 
ERGLDKV I TV 
QKGYTLKCQT 
V 



Seq ID NO: 654 DNA sequence 
Nucleic Acid Accession #: NM_000582 
Coding sequence: 88.. 990 



11 



31 



41 



51 



21 

! i 1 I I I 

GCAGAGCACA GCATCGTCGG GACCAGACTC GTCTCAGGCC AGTTGCAGCC TTCTCAGCCA 

AACGCCGACC AAGGAAAACT CACTACCATG AGAATTGCAG TGATTTGCTT TTGCCTCCTA 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 



60 
120 



436 



10 



15 



20 



25 



WO 02/086443 

GGCATCACCT GTGCCATACC 
CTTTACAACA AATACCCAGA 
CAGAAT CTCC TAGCCCCACA 
GATGATATGG ATGATGAAGA 
AACGACTCTG ATGATGTAGA 
TCTGATGAAT CTGATGAACT 
TTCACTCCAG TTGTCCCCAC 
GGACTGAGGT CAAAATCTAA 
GACGAGGACA TCACCTCACA 
CCCGTTGCCC AGGACCTGAA 
GAAACGAGTC AGCTGGATGA 
TATAAGCGGA AAGCCAATGA 
CTTTCCAAAG TCAGCCGTGA 
GTTGTAGACC CCAAAAGTAA 
TTAGATAGTG CATCTTCTGA 
ATTTAGTCAA AAGAAAAAAT 
CTCAGTTTAT TGGTTGAATG 
ATTAGTTTAG TTTGTGGCTT 
CT ATGTT CAT TCTATAGAAG 
T CATGAAT AG AAATTTATGT 
ATAACATTTT ATGTCACTAT 
TATCTTTTTG TGGTGTGAAT 
AATTGCTTAT TTGTTTTCCC 
GCCTAAAAAA AAAAAAAAAA 



PCT/US02/12476 



AGTTAAACAG 
TGCTGTGGCC 
GACCCTTCCA 
TGATGATGAC 
TGACACTGAT 
GGTCACTGAT 
AGTAGACACA 
GAAGTTTCGC 
CAT G G AAAG C 
CGCGCCTTCT 
CCAGAGTGCT 
TGAGAGCAAT 
ATTCCACAGC 
GGAAGAAGAT 
GGTCAATTAA 
GCTTTATAGC 
TGTATCTATT 
CATGGAAACT 
AAATGCAAAC 
AG AAG CAAAC 
AATCTTTTGT 
AAATCTTTTA 
ACGGTTGTCC 
AAAA 



GCTGATTCTG 
ACATGGCTAA 
AGTAAGTCCA 
CATGTGGACA 
GATTCTCACC 
TTTCCCACGG 
TATGATGGCC 
AGACCTGACA 
GAGGAGTTGA 
GATTGGGACA 
GAAACCCACA 
GAGCATTCCG 
CATGAATTTC 
AAACACCTGA 
AAGGAGAAAA 
AAAATGAAAG 
TGAGTCTGGA 
CCCTGTAAAC 
TATCACTGTA 
AAAATACTTT 
TTTTTAAGTT 
TCTTGAATGT 
AGCAATTAAT 



GAAGTTCTGA 
ACCCTGACCC 
ACGAAAGCCA 
GCCAGGACTC 
AGT CTGATGA 
ACCTGCCAGC 
GAGGTGATAG 
TCCAGTACCC 
ATGGTGCATA 
GCCGTGGGAA 
GCCACAAGCA 
ATGTGATTGA 
ACAGCCATGA 
AATTTCGTAT 
AATACAATTT 
AGAACATGAA 
AATAACTAAT 
TAAAAGCTTC 
TTTTAATATT 
TACCCACTTA 
AGTGTATATT 
AATAAGAATT 
AAAACATAAC 



GGAAAAGCAG 180 

ATCTCAGAAG 240 

TGACCACATG 300 

CATTGACTCG 360 

GTCTCACCAT 42 0 

AACCGAAGTT 480 

TGTGGTTTAT 540 

TGATGCTACA 60 0 

CAAGGCCATC 660 

GGACAGTTAT 72 0 

GTCCAGATTA 780 

TAGTCAGGAA 840 

AGATATGCTG 900 

TTCTCATGAA 960 

CTCACTTTGC 1020 

ATGCTTCTTT 1080 

GTGTTTGATA 1140 

AGGGTTATGT 12 00 

TGTTATTCTC 12 60 

AAAAGAGAAT 1320 

TTGTTGTGAT 1380 

TGGTGGTGTC 1440 

CTTTTTTACT 1500 



Seq ID NO: 655 Protein sequence 
Protein Accession #: NP 000573 



30 



35 



MRIAVICFCL 
PSKSNESHDH 
DFPTDL PATE 
SEELNGAYKA 
NEHSDVIDSQ 



11 
I 

LGITCAIPVK 
MDDMDDEDDD 
VFTPWPTVD 
IPVAQDLNAP 
ELSKVSREFH 



21 
I 

QADSGSSEEK 
DHVDSQDSID 
TYDGRGDSW 
SDWDSRGKDS 
SHEFHSHEDM 



31 
I 

QLYNKYPDAV 
SNDSDDVDDT 
YGhRSKSKKF 
YETSQLDDQS 
LWDPKSKEE 



41 



ATWLNPDPSQ 
DDSHQSDESH 
RRPDIQYPDA 
AETHSHKQSR 
DKHLKFR I SH 



51 
I 

KQNLLAPQTL 60 
HSDESDELVT 12 0 
TDEDITSHME 180 
LYKRKANDES 240 
ELDSASSEVN 



40 



Seq ID NO: 656 DNA sequence 

Nucleic Acid Accession #: NM_003108.1 

Coding sequence: 76.. 1401 



45 



50 



55 



60 



65 



70 



75 



GGGGTGGGAG 
GCCCTGCAAC 
CGGGAGGCGC 
GAGAGCGACC 
TTCATGGTAT 
AACGCCGAGA 
ATCCCGTTCA 
TACAAGTACC 
C AG AG C C C AG 
GGTGCCAAGA 
GCGGGCGCCA 
GACGACTACG 
ACGGTCAAGT 
CAGCTG CAG A 
CTGCAGCCGC 
CCCGCCAGCC 
GAGGTGCGGG 
AAGAACATCA 
TCGCGCTCGG 
GAGGACGCCG 
GCCAGCGAGC 
GATAAGGATT 
TACTGCACGC 
GACCTGGTGT 
AGCTGGGTTC 
ATGATGGTGG 
AT AT TGATAA 
TTAAAGTGAA 
TCCTTTATCG 
AAAATGTGTT 
GAGGGGGCGG 
GTCGGTCTTT 
TCTAGGGAGT 
TTTTTAACAA 



11 
I 

GGGGAGGGGG 
GGATCATGGT 
TGGACACGGA 
CAGACTGGTG 
GGTCCAAGAT 
TCTCCAAGAG 
TCCGGGAGGC 
GGCCCCGGAA 
AGAAGAGCGC 
CCT CCAAGGG 
AGGCGGGCGC 
TGCTGGGCAG 
GCGTGTTTCT 
TCAAACAGGA 
CGGGG CAGCA 
CTACGCTGAG 
CCGGCGCGAC 
CCAAGCAGCA 
TGTCCACCTC 
ACGACCTGAT 
AGCAGCTGGG 
TGGATTCGTT 
CGGAGCTGAG 
TCACATATTG 
CTTGGGAGGA 
TGTTGATGGT 
GATGT CGTG A 
ATGAGTAGTT 
TGTCTCAAGG 
T TTGTAATT A 
CGCGGCGGAG 
GAAGTCTGGA 
TGGTGGAGAT 
AAAAAGGG 



21 
1 

ACCTCCGCAC 
GCAGCAGGCG 
GGAGGGCGAA 
CAAGACGGCG 
CGAACGCAGG 
GCTGGGCAAG 
GGAGCGGCTG 
AAAGCCCAAA 
GGCCGGCGGC 
CTCCAGCAAG 
GGGCAAGGCG 
CCTGCGCGTG 
GGATGAGGAC 
GCCGGACGAG 
GCCGTCGCAG 
CAGCTCGGCG 
CTCGGGCGCC 
CCCGCCGCCG 
CTCGTCCAGC 
GTTCGACCTG 
GGGCGGCGCG 
CAGCGAGGGC 
CGAGATGATC 
AAAGGCGCCC 
AGTTGTAGTG 
GGCGGTGGTA 
CGCAAAGAAA 
TTTAAACATT 
TAGTTGCATA 
CTATTTCTTT 
GGGAGGTAGG 
AGACGTCTGC 
ATTTTTTTTT 



31 



41 



51 



GAGACCCAGC 
GAGAGCTTGG 
TTCATGGCTT 
TCGGGCCACA 
AAGATCATGG 
CGCTGGAAAA 
CGGCTCAAGC 
ATGGACCCCT 
GGCGGCGGGA 
AAATGCGGCA 
GCCCAGTCCG 
AGCGGCTCGG 
GACGACGACG 
GAGGACGAGG 
CTGCTGAGAC 
GAGTCCCCCG 
GGGGGCGGCA 
CTCGCGCAGC 
AGCAGCGGCA 
AGCTTGAATT 
GCGGCCGGGA 
AGCCTGGGCT 
GCGGGGGACT 
GCTGCTCGCT 
GTGATGATGA 
GGGTGGAGGG 
TTGGAAAACA 
TTTCCTGTCC 
CCTAGTCTGG 
TTCCTGAAAT 
ACCCGCTCCG 
AGAGGACCCT 
CTTAAGAGAA 



GGCCCGGGTT 
AAGCGGAGAG 
GCAGCCCGGT 
TCAAGCGGCC 
AGCAGTCTCC 
TGCTGAAGGA 
ACATGGCCGA 
CGGCCAAGCC 
GCGCGGGCGG 
AGCTCAAGGC 
GGGACTACGG 
GCGGCGGCGG 
ACGACGACGA 
AACCACCGCA 
GCTACAACGT 
AGGGAGCGAG 
GCCGCCTCTA 
CCGCGCTGTC 
GCAGCAGCGG 
TCTCTCAAAG 
ACCTGTCCCT 
CCCACTTCGA 
GGCTGGAGGC 
CTTTCTCTCG 
TGATGATGAT 
GAGAGAAGAA 
TGATGAAAAT 
TTTTTTTGTC 
AGTTGTGATT 
TCGTGATTGC 
GAAGGCGCTG 
TTTGG CAGCA 
CTTAAAGAAC 



GGAGCGTCCA 60 

CAACCTGCCC 12 0 

GGCCCTGGAC 180 

GATGAACGCG 240 

GGACATGCAC 300 

CAGCGAGAAG 3 60 

CTACCCCGAC 42 0 

CAGCGCCAGC 480 

AGGCGCGGGC 540 

CCCCGCGGCC 600 

GGGCGCGGGC 660 

CGCGGGCAAG 720 

CGACGAGCTG 780 

CCAGCAGCTC 840 

CGCCAAAGTG 900 

CCTCTACGAC 960 

CTACAGCTTC 1020 

GCCCGCGTCC 1080 

CAGCAGCGGC 1140 

CGCGCACAGC 1200 

GTCGCTGGTG 1260 

GTTCCCCGAC 132 0 

GAACTTCTCC 1380 

GAGGGTGCAG 1440 

AATGATGATG 1500 

GATGCTGATG 1560 

TTTGGTGGAG 1620 

CCCCCTCCCT 1680 

ATTTTCCCAA 1740 

AACAAAGGCA 180 0 

TTTGAAGCTT 1860 

CAACTGTTAC 1920 

TGGTGATTTT 1980 



Seq ID NO: 657 Protein sequence 
80 Protein Accession #: NP 003099.1 



1 11 21 31 41 51 

I 1 I I 1 I 

MVQQAESLEA ESNLPREALD TEEGEFMACS PVALDESDPD WCKTASGH I K RPMNAFMVWS 60 

85 KIERRKIMEQ SPDMHNAEIS KRLGKRWKML KDSEKIPFIR EAERLRLKHM ADYPDYKYRP 120 

RKKPKMDPSA KPSASQSPEK SAAGGGGGSA GGGAGGAKTS KG S SKKCGKL KAPAAAGAKA 180 

GAGKAAQSGD YGGAGDDYVL GSLRVSGSGG GGAGKTVKCV FLDEDDDDDD DDDELQLQIK 240 



437 



WO 02/086443 

QEPDEEDEEP PHQQIiLQPPG QQPSQLLRRY 
ATSGAGGGSR LYYSFKNITK QHPPPLAQPA 
LMFDLSLNFS QSAHSASEQQ LGGGAAAGNL 
LSEMIAGDWL EANFSDLVFT Y 



NVAkvPASPT LSSSAESPEG ASLYDEVRAG 
LSPASSRSVS TSSSSSSGSS SGSSGEDADD 
SLSLVDKDLD SFSEGSLGSH FEFPDYCTPE 



Seg ID NO: 658 DNA sequence 
Nucleic Acid Accession #: NM_001719 
Coding sequence: 123.. 1418 



1 11 21 31 41 51 

I 1 ! I I I 

GGGCGCAGCG GGGCCCGTCT GCAGCAAGTG ACCGACGGCC GGGACGGCCG CCTGCCCCCT 

CTGCCACCTG GGGCGGTGCG GGCCCGGAGC CCGGAGCCCG GGTAGCGCGT AGAGCCGGCG 

CGATGCACGT GCGCTCACTG CGAGCTGCGG CGCCGCACAG CTTCGTGGCG CTCTGGGCAC 

CCCTGTTCCT GCTGCGCTCC GCCCTGGCCG ACTTCAGCCT GGACAACGAG GTGCACTCGA 

GCTTCATCCA CCGGCGCCTC CGCAGCCAGG AGCGGCGGGA GATGCAGCGC GAGATCCTCT 

CCATTTTGGG CTTGCCCCAC CGCCCGCGCC CGCACCTCCA GGGCAAGCAC AACT CGGCAC 

CCATGTTCAT GCTGGACCTG TACAACGCCA TGGCGGTGGA GGAGGGCGGC GGGCCCGGCG 

GCCAGGGCTT CTCCTACCCC TACAAGGCCG TCTTCAGTAC CCAGGGCCCC CCTCTGGCCA 

GCCTGCAAGA TAGCCATTTC CTCACCGACG CCGACATGGT CATGAGCTTC GTCAACCTCG 

TGGAACATGA CAAGGAATTC TTCCACCCAC GCTACCACCA TCGAGAGTTC CGGTTTGATC 

TTTCCAAGAT CCCAGAAGGG GAAGCTGT C A CGGCAGCCGA ATTCCGGATC TACAAGGACT 

ACATCCGGGA ACGCTTCGAC AATGAGACGT TCCGGATCAG CGTTTATCAG GTGCTCCAGG 

AG CACTTGGG CAGGGAATCG GATCTCTTCC TGCTCGACAG CCGTACCCTC TGGGCCTCGG 

AGGAGGGCTG GCTGGTGTTT GACATCACAG CCACCAGCAA CCACTGGGTG GTCAATCCGC 

GGCACAACCT GGGCCTGCAG CTCTCGGTGG AGACGCTGGA TGGGCAGAGC ATCAACCCCA 

AGTTGGCGGG CCTGATTGGG CGGCACGGGC CCCAGAACAA GCAGCCCTTC ATGGTGGCTT 

TCTTCAAGGC CACGGAGGTC CACTTCCGCA GCATCCGGTC CACGGGGAGC AAACAGCGCA 

GCCAGAACCG CTCCAAGACG CCCAAGAACC AGGAAGCCCT GCGGATGGCC AACGTGGCAG 

AGAACAGCAG CAGCGACCAG AGGCAGGCCT GTAAGAAGCA CGAGCTGTAT GTCAGCTTCC 

GAGACCTGGG CTGGCAGGAC TGGAT CAT CG CGCCTGAAGG CTACGCCGCC TACTACTGTG 

AGGGGGAGTG TGCCTTCCCT CTGAACTCCT ACATGAACGC CACCAACCAC GCCATCGTGC 

AGACGCTGGT CCACTTCATC AACCCGGAAA CGGTGCCCAA GCCCTGCTGT GCGCCCACGC 

AGCTCAATGC CATCTCCGTC CTCTACTTCG ATGACAGCTC CAACGTCATC CTGAAGAAAT 

ACAGAAACAT GGTGGTCCGG GCCTGTGGCT GCCACTAGCT CCTCCGAGAA TTCAGACCCT 

TTGGGGCCAA GTTTTTCTGG ATCCTCCATT GCTCGCCTTG GCCAGGAACC AGCAGACCAA 

CTGCCTTTTG TGAGACCTTC CCCTCCCTAT CCGCAACTTT AAAGGTGTGA GAGTATTAGG 

AAACATGAGC AGCATATGGC TTTTGATCAG TTTTTCAGTG GCAGCATCCA ATGAACAAGA 

TCCTACAAGC TGTGCAGGCA AAACCTAGCA GGAAAAAAAA ACAACGCATA AAGAAAAATG 

GCCGGGCCAG GTCATTGGCT GGGAAGTCTC AGCCATGCAC GGACTCGTTT CCAGAGGTAA 

TTATGAGCGC CTACCAGCCA GGCCACCCAG CCGTGGGAGG AAGGGGGCGT GGCAAGGGGT 

GGGCACATTG GTGTCTGTGC GAAAGGAAAA TTGACCCGGA AGTTCCTGTA ATAAATGTCA 

CAATAAAACG AATGAATG 



Seq ID NO: 65 9 Protein sequence 
Protein Accession #: NP 001710 



1 11 21 31 41 51 

I I I I l ) 

MHVRSLRAAA PHSFVALWAP LFLLRSALAD FSLDNEVHSS FIHRRLRSQE RREMQREILS 

ILGLPHRPRP HLQGKHNSAP MFMLDLYNAM AVEEGGGPGG QGFSYPYKAV FSTQGPPLAS 

LQDSHFLTDA DMVMSFVNLV EHDKEFFHPR YHHREFRFDL SKIPEGEAVT AAEFRIYKDY 

IRERFDNETF RISVYQVLQE HLGRESDLFL LDSRTLWASE EGWLVFDITA TSNHWWNPR 

HNLGLQLSVE TLDGQSINPK LAGLIGRHGP QNKQPFMVAF FKATEVHFRS IRSTGSKQRS 

QNRSKTPKNQ EALRMANVAE NSSSDQRQAC KKHELYVSFR DLGWQDWIIA PEGYAAYYCE 

GECAFPLNSY MNATNHA I VQ TLVHFINPET VPKPCCAPTQ LNAISVLYFD DSSNVILKKY 
RNMWRACGC H 



Seq ID NO: 660 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 211.. 1895 

1 11 21 31 41 51 

I I i I I l 

GG AT CTGAGG GGCGCCCAGT CACTTCCTCC ACGTTCT CGT GCTGGGCGGG AGGAGCGGAT 
GGGGCTTGGG AGGCAGCCTG CTCTCCAGTC CCTATCCACC CACAGGTTTT TTGGGTCGGA 
GAGGAATTAT CTGATAAAAT TCCTGGGTTA ATATTTTTAA AAACGGAGAG TTTTTAAAAA 
TGATTTTTTT CCCTCGAAAA TGACCTTTTT ATGCTTCGAA GCAGTTTGTC AACCAGCATA 
GTGCTTTTTC TTTTCTCTTC TTTTTCTACG ATAAATGAAA GCATTTCTTC AAGAAAAAGG 
CACAGGTTCC TTGAACAGCT GGATTCTGAT GGCACCATTA CTATAGAGGA GCAGATTGTC 
CTTGTGCTGA AAGCGAAAGT ACAATGTGAA CTCAACATCA CAGCTCAACT CCAGGAGGGA 
GAAGGTAATT GTTTCCCTGA ATGGGATGGA CTCATTTGTT GGCCCAGAGG AACAGTGGGG 
AAAATAT CGG CTGTTCCATG CCCTCCTTAT ATTTATGACT TCAACCATAA AGGAGTTGCT 
TTCCGACACT GTAACCCCAA TGGAACATGG GATTTTATGC ACAGCTTAAA TAAAACATGG 
GCCAATTATT CAGACTGCCT TCGCTTTCTG CAGCCAGATA TCAGCATAGG AAAGCAAGAA 
TTCTTTGAAC GCCTCTATGT AATGTATACC GTTGGCTACT CCATCTCTTT TGGTTCCTTG 
GCTGTGGCTA TTCTCATCAT TGGTTACTTC AGACGATTGC ATTGCACTAG GAACTATATC 
CACATGCACT TATTTGTGTC TTTCATGCTG AGAGCTACAA GCATCTTTGT CAAAGACAGA 
GTAGT CCATG CTCACATAGG AGTAAAGGAG CTGGAGTCCC TAATAATGCA GGATGACCCA 
CAAAATTCCA TTGAGGCAAC TTCTGTGGAC AAATCACAAT AT AT CGGGTG CAAGATTGCT 
GTTGTGATGT T TAT T TACT T CCTGGCTACA AATTATTATT GGATCCTGGT GGAAGGTCTC 
TACCTGCATA ATCTCATCTT TGTGGCTTTC TTTTCGGACA CCAAATACCT GTGGGGCTTC 
ATCTTGATAG GCTGGGGGTT TCCAGCAGCA TTTGTTGCAG CATGGGCTGT GGCACGAGCA 
ACTCTGGCTG ATGCGAGGTG CTGGGAACTT AGTGCTGGAG ACATCAAGTG GATTTATCAA 
GCACCGATCT TAGCAGCTAT TGGGCTGAAT TTTATTCTGT TTCTGAATAC GGTTAGAGTT 
CTAGCTACCA AAAT CTGGG A GACCAATGCA GTTGGGCATG ACACAAGGAA GCAATACAGG 
AAACTGGCCA AATCGACACT GGTCCTGGTC CTAGTCTTTG GAGTGCATTA CAT CGTGTTC 



438 



10 



15 



20 



WO 02/086443 

GTATGCCTGC CTCACTCCTT 
TTCTTCAACT CCTTT CAGGG 
GTTCAGGCAG AGGTGAAGAA 
ACACCGCCAT GTGGCAGCCG 
AGCAGCCAGT CACAGGTGGC 
AAGATCGCCA GCAGACAGCC 
TCAGAGCAGG ACTGCCTGCC 
CAGGGAGATG ATATTCTAAT 
GAAGGATGCC AAGGAGAAAC 
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CACTGGGCTC 
TTTCTTTGTG 
GATGTGGAGT 
CAGATGCGGC 
GGCCAGCACA 
TGACAGCCAC 
ACACTCTTTC 
GGAGAAGCCT 
TGAGGATGTT 



GGGTGGGAGA 
TCTATCATCT 
CGGTGGAATC 
TCAGTGCTCA 
CGCATGGTGC 
ATCACTTTAC 
CACGAGGAGA 
TCCAGGCCTA 
CTCTGA 



TCCGCATGCA 
ACTGCTACTG 
TCTCCGTGGA 
CCACCGTGAC 
TTATCTCTGG 
CTGGCTATGT 
CCAAGGAAGA 
TGGAATCTAA 



CTGTGAGCTC 
CAATGGAGAG 
CTGGAAAAGG 
GCACAGCACC 
CAAAGCTGCC 
CTGGAGTAAC 
TAGTGGGAGG 
CCCAGACACT 



Seq ID NO: 661 Protein sequence 
Protein Accession #: Eos sequence 



25 



MhRSSLSTSI 
LNITAQLQEG 
DPMHSLNKTW 
RRLHCTRNYI 
KSQYIGCKIA 
FVAAWAVARA 
VGHDTRKQYR 
SIIYCYCNGE 
RMVLISGKAA 
SRPMESNPDT 



11 
I 

VhFLFSSFST 
EGNCFPEWDG 
ANYSDCLRFL 
HMHLFVSFML 
WMFIYFLAT 
TLADARCWEL 
KLAKSTLVIiV 
VQAEVKKMWS 
KIASRQPDSH 
EGCQGETEDV 



21 
I 

INESISSRKR 
LICWPRGTVG 
QPDISIGKQE 
RATS I FVKDR 
NYYWILVEGL 
SAGDIKWIYQ 
LVFGVHYIVF 
RWNLSVDWKR 
ITLPGYVWSN 
L 



31 
I 

HRFI/EQLDSD 
KISAVPCPPY 
FFERLYVMYT 
WHAHIGVKE 
YLHNLIFVAF 
APILAAIGLN 
VCLPHSFTGL 
TPPCGSRRCG 
SEQDCLPHSF 



41 
I 

GTITIEEQIV 
IYDFNHKGVA 
VGYSISFGSL 
IiESIiIMQDDP 
FSDTKYLWGF 
FILFLNTVRV 
GWEIRMHCEL 
SVLTTVTHST 
HEETKEDSGR 



51 
I 

LVLKAKVQCE 
FRHCNPNGTW 
AVAILIIGYF 
QNSIEATSVD 
ILIGWGFPAA 
LATKIWETNA 
FFNSFQGFFV 
SSQSQVAAST 
QGDDILMEKP 



1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 



60 
12 0 
180 
240 
300 
360 
420 
480 
540 



Seq ID NO; 662 DNA sequence 
Nucleic Acid Accession #: NM_005048 
Coding sequence: 143.. 1795 

30 

1 11 21 31 41 51 

I I I I I I 

GGCCGGTGGC CCGGGCCCGA CCACCCCAGC TGCGCGTCGT TACTGGCCAC AAGTTTGCTC 60 

TGGGCCAGCC AAGTTGGCAA CTTGGAAGCT TCTCCCGGGC TCTGGAGGAG GGTCCCTGCT 12 0 

35 TCTTCCTACA GCCGTTCCGG GCATGGCCGG GCTGGGGGCG TCGCTCCACG TCTGGGGTTG 180 

GCTAATGCTC GGCAGCTGCC TCCTGGCCAG AGCCCAGCTG GATT CTGATG GCACCATTAC 240 

TATAGAGGAG CAGATTGTCC TTGTGCTGAA .AGCGAAAGTA CAATGTGAAC TCAACATCAC 300 

AGCTCAACTC CAGGAGGGAG AAGGTAATTG TTTCCCTGAA TGGGATGGAC TCATTTGTTG 360 

GCCCAGAGGA ACAGTGGGGA AAATAT CGGC TGTTCCATGC CCTCCTTATA TTTATGACTT 420 

40 CAACCATAAA GGAGTTGCTT TCCGACACTG TAACCCCAAT GGAACATGGG ATTTTATGCA 480 

CAGCTTAAAT AAAACATGGG CCAATTATTC AGACTGCCTT CGCTTTCTGC AGCCAGATAT 540 

CAGCATAGGA AAGCAAGAAT TCTTTGAACG CCTCTATGTA ATGTATACCG TTGGCTACTC 600 

CATCTCTTTT GGTTCCTTGG CTGTGGCTAT TCTCATCATT GGTTACTTCA GACGATTGCA 660 

TTGCACTAGG AACTATATCC ACATGCACTT ATTTGTGTCT TTCATGCTGA GAGCTACAAG 720 

45 CATCTTTGTC AAAGACAGAG TAGTCCATGC TCACATAGGA GTAAAGGAGC TGGAGTCCCT 7 80 

AATAATGCAG GATGACCCAC AAAATT CC AT TGAGGCAACT TCTGTGGACA AATCACAATA 84 0 

TATCGGGTGC AAGATTGCTG TTGTGATGTT TATTTACTTC CTGGCTACAA ATTATTATTG 900 

GATCCTGGTG GAAGGTCTCT ACCTGCATAA TCTCATCTTT GTGGCTTTCT TTTCGGACAC 960 

CAAATACCTG TGGGGCTTCA TCTTGATAGG CTGGGGGTTT CCAGCAGCAT TTGTTGCAGC 102 0 

50 ATGGGCTGTG GCACGAGCAA CTCTGGCTGA TGCGAGGTGC TGGGAACTTA GTGCTGGAGA 10 80 

CATCAAGTGG ATTTATCAAG CACCGATCTT AGCAGCTATT GGGCTGAATT TTATTCTGTT 1140 

TCTGAATACG GTTAGAGTTC TAGCTACCAA AAT CTGGGAG ACCAATGCAG TTGGGCATGA 12 0 0 

CACAAGGAAG CAATACAGGA AACTGGCCAA AT CGACACTG GTCCTGGTCC TAGTCTTTGG 1260 

AGTGCATTAC ATCGTGTTCG TATGCCTGCC TCACTCCTTC ACTGGGCTCG GGTGGGAGAT 1320 

55 CCGCATGCAC TGTGAGCTCT TCTTCAACTC CTTTCAGGGT TTCTTTGTGT CTATCATCTA 13 80 

CTGCTACTGC AATGGAGAGG TTCAGGCAGA GGTGAAGAAG ATGTGGAGTC GGTGGAATCT 1440 

CTCCGTGGAC TGGAAAAGGA CACCGCCATG TGGCAGCCGC AGATGCGGCT CAGTGCTCAC 1500 

CACCGTGACG CACAGCACCA GCAGCCAGTC ACAGGTGGCG GCCAGCACAC GCATGGTGCT 1560 

TATCTCTGGC AAAGCTGCCA AGATCGCCAG CAGACAGCCT GACAGCCACA TCACTTTACC 162 0 

60 TGGCTATGTC TGGAGTAACT CAGAGCAGGA CTGCCTGCCA CACTCTTTCC ACGAGGAGAC 168 0 

CAAGGAAGAT AGTGGGAGGC AGGGAGATGA TATT CTAATG GAGAAGCCTT CCAGGCCTAT 1740 

GGAATCTAAC CCAGACACTG AAGGATGCCA AGGAGAAACT GAGGATGTTC TCTGAATGGA 1800 

CATTTGTGGC TGACTTTCAT GGGCTGGTCC AATGGCTGGT TGTGTGAGAG GGCTTGGCTG 1860 

ATACTCCTAT GCTTGAGTTC AAAGGCTGAA AATTCAGTTA AGGTGTTACT TAATAATAGT 1920 

65 TTTTAGGCTC CATGAATTGG CTCCTGTAAA TACTAACGAC ATGAAAATGC AAGTGTCAAT 1980 

GGAGTAGTTT ATTACCTTCT ATTGGCATCA AGTTTTCCTC TAAATTAATG TATGGTATTT 2 040 

GCTCTGTGAT TGTTCATTTT TTTCTGCTAC TTTTGGGTAG AAAAAAGATT CAATTGCTTG 2100 

GCTGTAGCTT TCTCTCATAT ATATCACCCT AAATATAATG AAGATCTTTT AGTGTGTATC 2160 

ATTTTCCTTT TAGAAACTAG TATTCTCTTA TTTCTTACTT TAATGTACTT CTATCACTGC 2220 

70 ATTTATTTTG CCTGTGCATA GGAGCAATTA GGATCTAAAA AAATAT ATGG GAAGATAAAA 22 8 0 

GAT CTAAGAA CAAGTACTTG CTGG AAAATT AGTTGGCTGG ACATTGATAA AATAATGCAT 2340 

TTATAACAAT TACATGTGTT TTTGGGAACA AGGAAAATTT CTCAAAAAAG AATATTTCAC 2400 

ACATCCCTTC TTTTGAATGG CCTCTTTGTG ACCAGCCAGA CCTCAGGTCT TCACTCTTTC 2460 

TTCTTTGTAA ACCATGTCAT GTGGAAAGAT TTCCTCAGTT AGTGAGCTTG TGTCTGCAAA 2520 

75 TTGATTTTGT TTGTAATGTA TTTTGATAGG AAATCATGCT GCATCTATAT CTTTTTCTTG 258 0 

TTTGAGCTGT TACTACATTG TACATGGCAT GTGGGATCAA TTAAAAATTT GTTTTAAAAA 2640 
T 



Seq ID NO: 663 Protein sequence 
80 Protein Accession #: NP_005039 

1 11 21 31 41 51 

1111)1 

MAGLGASI/HV WGWLMLGSCL LARAQLDSDG TITIEEQIVL VLKAKVQCEL NITAQLQEGE 60 

85 GNCFPEWDGI* ICWPRGTVGK ISAVPCPPYI YD FNHKGVAF RHCNPNGTWD FMHSLNKTWA 120 

NYSDCLRFLQ PDISIGKQEF FERLYVMYTV GYSISFGSLA VAIL I IGYFR RLHCTRNYIH 180 

MHLFVSFMLR ATSIFVKDRV VHAHIGVKEL ESLIMQDDPQ NSIEATSVDK SQYIGCKIAV 240 
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40 
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VMFIYFLATN YYWILVEGLY 
LADARCWELS AGDIKWIYOA 
LAKSTLVLVL VFGVHYIVFV 
QAEVKKMWSR WNLSVDWKRT 
IASRQPDSHI TLPGYWSNS 
GCQGETEDVL 



PCT/US02/12476 



LHNLIFVAFF 
PILAAIGLNF 
CLPHSFTGLG 
PPCGSRRCGS 
EQDCLPHSFH 



SDTKYLWGFI 
ILFLNTVRVL 
WEIRMHCELF 
VLTTVTHSTS 
EETKEDSGRQ 



LIGWGFPAAF 
ATKI WETNAV 
FNSFQGFFVS 
SQSQVAASTR 
GDDILMEKPS 



VAAWAVARAT 
GHDTRKQYRK 
IIYCYCNGEV 
MVLISGKAAK 
RPMESNPDTE 



Seq ID NO: 664 DNA sequence 
Nucleic Acid Accession #i NM_012152 
Coding sequence: 43.. 1104 



1 

! 

CTTCTTTAAA 
GACAAGCACA 
GGAACAAAGC 
TCTAATTCTC 
TACCTGTTGG 
ATGTTTAACA 
GGGCTTCTGG 
AGGCACATGT 
CTGCTCATTT 
TGGAATTGCC 
TACCTTGTTT 
CTGCGGATCT 
TCCATCAGCC 
GCGTTTGTGG 
AGGCAGTGTG 
GTCGTGAACC 
ATGATCTGCT 
GTCCTCAGCA 
GTCTGCAATA 
GTCTTAGG 



11 

I 

TTTCTTTCTA 
TGGACTTTTT 
TTGTGATTGT 
TGGTCATCGC 
CTAATTTAGC 
CAGGCCCAGT 
ACAGTAGCTT 
CAATCATGAG 
TGCTTGTCTG 
TCTGCAACAT 
TCTGGACAGT 
ACGTGTACGT 
GCCGGAGGAC 
TATGCTGGAC 
GCGTGCAGCA 
C CAT CAT C T A 
GCTTCTCTCA 
GGAGTGACAC 
AAAGCACTTC 



21 
I 

GGATGTT CAC 
TTATAATAGG 
TTTGTGTGTT 
GGCAGTGATC 
TGCTGCCGAT 
TTCAAAAACT 
GACTGCTTCC 
GATGCGGGTC 
GGCCATCGCC 
CTCTGCCTGC 
GTCCAACCTC 
CAAGAGGAAA 
ACCCATGAAG 
CCCGGGCCTG 
TGTGAAAAGG 
CTCCTACAAG 
GGAGAACCCA 
AGGCAGCCAG 
CTAAACTCTG 



31 

I 

TTCTTCTCCA 
AGCAACACTG 
GGGACGTTTT 
AAAAACAGAA 
TTCTTCGCTG 
TTGACTGTCA 
CTCACCAACT 
CATAGCAACC 
ATTTTTATGG 
TCTTCCCTGG 
ATGGCCTTCC 
ACCAACGTCT 
CTAATGAAGA 
GTGGTTCTGC 
TGGTTCCTGC 
GACGAGGACA 
GAGAGGCGTC 
TACATAGAGG 
GATGCCTCTC 



41 



CAATGAATGA 
ATACTGTCGA 
TCTGCCTGTT 
AATTTCATTT 
GAATTGCCTA 
ACCGCTGGTT 
TGCTGGTTAT 
TGACCAAAAA 
GGGCGGTCCC 
CCCCCATTTA 
TCATCATGGT 
TGTCTCCGCA 
CGGTGATGAC 
TCCTCGACGG 
TGCTGGCGCT 
TGTATGGCAC 
CCTCTCGCAT 
ATAGTATTAG 
GGCCCACCCA 



51 
I 

GTGTCACTAT 
TGACTGGACA 
TATTTTTTTT 
CCCCTTCTAC 
TGTATTCCTG 
TCTCCGTCAG 
CGCCGTGGAG 
GAGGGTGACA 
CACACTGGGC 
CAGCAGGAGT 
TGTGGTGTAC 
TACAAGTGGG 
TGTCTTAGGG 
CCTGAACTGC 
GCTCAACTCC 
CATGAAGAAG 
CCCCTCCACA 
CCAAGGTGCA 
GGTGATGACT 



Seq ID NO: 665 Protein sequence 
Protein Accession #: NP 036284 



45 



MNECHYDKHM 
FHFPFYYLLA 
LVIAVERHMS 
PIYSRSYLVF 
VMTVLGAFW 
YGTMKKMICC 



11 

I - 

DFFYNRSNTD 
NLAAADFFAG 
I MRMRVH SNIi 
WTVSNLMAFL 
CWTPGLWLL 
FSQENPERRP 



21 
I 

TVDDWTGTKL 
IAYVFLMFNT 
TKKRVTLLIL 
IMVWYLRIY 
LDGLNCRQCG 
SRIPSTVLSR 



31 
I 

VIVLCVGTFF 
GPVSKTLTVN 
LVWAIAIFMG 
VYVKRKTNVL 
VQHVKRWFLL 
SDTGSQYIED 



41 

1 

CLFIFFSNSL 
RWFLRQGLLD 
AVPTLGWNCI, 
SPHTSGSISR 
LALLNSWNP 
SISQGAVCNK 



51 
I 

VIAAVIKNRK 
SSLTASLTNL 
CNISACSSLA 
RRTPMKLMKT 
IIYSYKDEDM 
STS 



300 
360 
420 
480 
540 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 



60 
120 
180 
240 
300 



50 



Seq ID NO: 666 DNA sequence 
Nucleic Acid Accession #: NM_002821 
Coding sequence: 150.. 3362 



55 



60 



65 



70 



75 



80 



85 



AACTCCCGCC 
GCGCTCCGGT 
CCTCAGCTCC 
CCCGCCGGTT 
CCATTGTCTT 
TTCGCTGTGA 
CTGTCCAGGA 
ACCGGCTGCA 
AAGCCCGCAG 
TGAAGCATCC 
ACATTGATGG 
ATGGTCAGAG 
GTCCTG AG CA 
GCAGCCAGAA 
CCCAGGACGT 
AGCCACCCCC 
GCCCCCCACA 
TCCGGCCACG 
TCATCCTGGA 
GGGTGTTTAC 
AGCCCAGCGT 
AGAAGGGCCA 
GCCACGCGGC 
TGCCCTCCTG 
TGGATTGCCT 
T CATCT CAGA 
TGGAGGTGTA 
AGGCGCAAGC 
AGCAGTGCAT 
AG CCCACTAT 
ACGCTGGGAC 
TTGCCTCCAA 
TTATCACCTT 
TGCAGTGCGA 
TCCTGGACCC 



11 

I 

TCGGGACGCC 
GCGTCCGCCT 
TTTTCCTGAG 
GCCTCTGCTC 
CAT CAAGCAG 
GGTTGAGGCT 
CACGGAGCGG 
GGACTCTGGC 
TGCCAACGCC 
AGCCTCGGAA 
GCACCCTCGG 
CAACCACACA 
TAGTGGGCTG 
CTTCACCTTG 
GGTAGTAGCG 
GAGCCTGCAG 
CCTCCGCAGA 
CAATGCAGGG 
AGCCACACTT 
AGCTGGCAGC 
GTGGTGGGAG 
CGAGCTGGTG 
CAACCTGGCT 
GCTGAAGAAG 
GACCCAGGCC 
GGACTCACGG 
TGATGGGACA 
CCGTGTCCAA 
GGAGTTTGAC 
TAAGTGGGAA 
CCTGCATTTT 
CGGGCCGCAG 
CAAAGTGGAA 
GGCCCAGGGG 
CACCAAGCTG 



21 

i 

TCGGGGT CGG 
CCTGTGCCCG 
CCCGCCGCGA 
AGCGTCCTGC 
CCGTCCTCCC 
CCGGGCCCGG 
CGTTTCGCCC 
ACCTTCCAGT 
TCCTTCAACA 
GCTGAGATCC 
CCCACCTACC 
GTCAGCAGCA 
TATTCCTGCT 
AGCATTGCTG 
AGGTATGAGG 
TGGCTCTTTG 
GCCACAGTGT 
ATCTACCGCT 
CACCTAGCAG 
GAGGAGCGTG 
CACGCGGGAG 
TTGGCCAATA 
GGTCAGCGGA 
CCCCAAGACA 
ACACCAAAAC 
TTCGAGGTCT 
TGGTACCGTT 
GTGCTGGAAA 
AAGGAGGCCA 
CGGGCAGATG 
GCCCGGGTGA 
GGCCAGATTC 
CCAGAGCGTA 
GACCCCAAGC 
GGACCCAGGA 



31 



GCTCCGGCTG 
CCGCGGAGCA 
TGGGAGCTGC 
TGCTGCCGCT 
AGGATGCACT 
TACATGTGTA 
AGGGCAGCAG 
GTGTGGCTCG 
TCAAATGGAT 
AGCCACAGAC 
AATGGTTCCG 
AGGAGCGGAA 
GCGCCCACAG 
ATGAAAGCTT 
AGGCCATGTT 
AGGATGAGAC 
TTGCCAACGG 
GCATTGGCCA 
AGATTGAAGA 
TGACCTGCCT 
TCCGGCTGCC 
TTGCTGAAAG 
GACAGGATGT 
GCCAGCTGGA 
CTACAGTTGT 
TCAAGAATGG 
GTATGAGCAG 
AGCTCAAGTT 
CGGTGCCCTG 
GGAGCAGCCT 
CTCGAGATGA 
GTGCCCATGT 
CGACTGTGTA 
CGCTGATTCA 
TGCACATCTT 



41 
I 

CGGCTGCTGC 
GTCTGCGGCC 
GCGGGGATCC 
GCTGGGCGGT 
GCAGGGGCGC 
CTGGCTGCTC 
CCTGAGCTTT 
GGATGATGTC 
TGAGGCAGGT 
CCAGGTCACA 
AGATGGGACC 
CCTGACGCTC 
TGCTTTTGGC 
TGCCAGGGTG 
CCATTGCCAG 
TCCCATCACT 
GTCTCTGCTG 
GGGGCAGAGG 
CATGCCGCTA 
TCCCCCCAAG 
CACCCATGGC 
TGATGCTGGT 
CAACATCACT 
GGAGGGCAAA 
CTGGTACAGA 
GACCTTGCGC 
CACCCCAGCC 
CACACCACCA 
TTCAGCCACA 
CCCAGAGTGG 
CGCTGGCAAC 
CCAGCTCACT 
CCAGGGCCAC 
GTGGAAAGGC 
CCAGAATGGC 



51 



TGCGGCGCCC 60 

CGCCGTGCGC 120 

CCGGCCAGAC 180 

ACCCAGACAG 240 

CGGGCGCTGC 300 

GATGGGGCCC 3 60 

GCAGCTGTGG 42 0 

ACTGGAGAAG 4 8 0 

CCTGTGGTCC 540 

CTTCGTTGCC 600 

CCCCTTTCTG 660 

CGGCCAGCTG 720 

CAGGCTTGCA 780 

GTGCTGGCAC 84 0 

TTCTCAGCCC 900 

AACCGCAGTC 960 

CTGACCCAGG 1020 

GGCCCACCCA 1080 

TTTGAGCCAC 1140 

GGTCTGCCAG 12 00 

AGGGTCTACC 1260 

GTCTACACCT 1320 

GTGGCCACTG 13 80 

CCCGGCTACT 1440 

AACCAGATGC 150 0 

ATCAACAGCG 1560 

GGCAGCATCG 162 0 

CCCCAGCCAC 1680 

GGCCGAGAGA 174 0 

GTGACAGACA 18 0 0 

TACACTTGCA 186 0 

GTGGCAGTTT 192 0 

ACAGCCCTAC 1980 

AAGGACCGCA 2 040 

TCCCTGGTGA 2100 



440 



15 



WO 02/086443 

TCCATGACGT GGCCCCTGAG 
ACATCAAGCA CACGGAGGCC 
AGGGCCCTGG CAGCCCTCCC 
CCGCTGTGGC CTACATCATT 
5 AAGCCAAGCG GCTGCAGAAG 

GAGGGCCTTT GCAGAACGGG 
GCTTGGGCTC CGGCCCCGCG 
TCCCACGGTC TAGCCTGCAG 
TCCTGGCAAA GGCTCAGGGC 
10 GCCTGCAGAC GAAG GAT GAG 

GGAAGCTGAA CCACGCCAAC 
ACTACATGGT GCTGGAATAT 
AGAGCAAGGA TGAAAAATTG 
GCACCCAGGT AGCCCTGGGC 
TGGCTGCGCG TAACTGCCTG 
TCAGCAAGGA TGTGTACAAC 
GCTGGATGTC CCCCGAGGCC 
CCTTCGGTGT GCTGATGTGG 
CAGATGATGA AGTACTGGCA 
20 GCTGCCCTTC CAAACTCTAT 
GGCCCTCCTT CAGTGAGATT 
GAGGAGGGAG CCCGCTCAGG 
CAGCATGATG GGCAAGATCC 
TTGCTGAGGT CTGAGCAGGG 
GGCTGACTTG GACCCAAACT 
CTCTTCCTCT ATCAGGGACA 
TTCTCCCCTT GACCGGGTCC 
AGGCTTGGGA TGAGCTGGGT 
AGGGTTAATG AGTCTCTTGC 
ACACAGCAAG TGAGTCCTCC 
CCCCACCCTT CTCTCCTTTC 
CTTTTGACAC TATATAAACC 
TGCAGCGTGG GGTGGGTGGG 
GCCATCCTTA CCCCACACTT 
35 TGTTTTTGTT TTTACACTCG 



25 



30 



GACTCAGGCC 
CCCCTCTATG 
CCCTACAAGA 
GCCGTGCTGG 
CAGCCCGAGG 
CAGCCCTCAG 
GCCACCAACA 
CCCATCACCA 
TTGGAGGAGG 
CAGCAGCAGC 
GTGGTGCGGC 
GTGGATCTGG 
AAGTCACAGC 
ATGGAGCACC 
GTCAGTGCCC 
AGTGAGTACT 
AT CCTGGAGG 
GAAGTGTTTA 
GATTTGCAGG 
CGGCTGATGC 
GCCAGCGCCC 
ATGGCCTGGG 
CTGTCCTCCT 
CCTGGCCTTT 
GGGCGACTAG 
GTGTGGGTGC 
AACTCTGCCA 
TTGTGGGGAG 
CCACTGGTCC 
CCACTCTGGG 
CTCATCCTAA 
GCCCTTTTTG 
CATGGGAGGT 
TTATTGTTGT 
CTGCTCTCAA 



GCTACACCTG 
TCGTGGACAA 
TG AT CCAGAC 
GCCTCATGTT 
GCGAGGAGCC 
CAGAGATCCA 
AACGCCACAG 
CGCTGGGGAA 
GAGTGGCAGA 
TGGACTTCCG 
TCCTGGGGCT 
GAGACCTCAA 
CCCTCAGCAC 
TGTCCAACAA 
AGAGACAAGT 
ACCACTTCCG 
GTGACTTCTC 
CACATGGAGA 
CTGGGAAGGC 
AGCGCTGCTG 
TGGGAGACAG 
CAGGGGAGGA 
GGGCCCTGAG 
CCTCCTCTTC 
GGCTTTGAGC 
CACAGGTAAC 
CTCATCTGCC 
TTCCTTAATA 
ACTTGGGGGT 
CTTGTGCACA 
GTGCCTGGCA 
TATGCACCAC 
AGGGGTGGGC 
CGTTTTTTGT 
TAAATAAGCC 



CATTGCAGGC 
GCCTGTGCCG 
CATTGGGTTG 
CTACTGCAAG 
AGAGATGGAA 
AGAAGAAGTG 
CACAAGTGAT 
GAGTGAGTTT 
GACCCTGGTA 
GAGGGAGTTG 
GTGCCGGGAG 
GCAGTTCCTG 
CAAGCAGAAG 
CCGCTTTGTG 
GAAGGTGTCT 
CCAGGCCTGG 
TACCAAGTCT 
GATGCCCCAT 
TAGACTTCCT 
GGCCCTCAGC 
CACCGTGGAC 
CATCTCTAGA 
GTGCCCTAGT 
CTCACCCTCA 
TGGGCAGTTT 
CCCAATTTCT 
AACTTTGCCT 
TTCTCAAGTT 
CT AG AC CAGG 
CTGACCCAGA 
GATGAAGGAG 
GGGCGGCTTT 
CCTGGAGATG 
TTGTTTTGTT 
TTTTTTA 



AACAGCTGCA 2160 

GAGGAGTCGG 2220 

TCGGTGGGTG 2280 

AAGCGCTGCA 2340 

TGCCTCAACG 2400 

GCCTTGACCA 2460 

AAGATGCACT 2 52 0 

GGGGAGGTGT 2580 

CTTGTGAAGA 2 640 

GAGATGTTTG 2700 

GCTGAGCCCC 2760 

AGGATTTCCA 2820 

GTGGCCCTAT 2880 

CATAAGGACT 2 940 

GCCCTGGGCC 3000 

GTGCCGCTGC 3060 

GATGTCTGGG 3120 

GGTGGGCAGG 3180 

CAGCCCGAGG 3240 

CCCAAGGACC 330 0 

AGCAAGCCGT 3 360 

GGGAAGCTCA 3420 

GCAACAGGCA 3480 

TCCTTTGGGA 3 540 

CCCCTGCCAC 3600 

GGCCTTCAAC 3660 

GGGGAGGGCT 3720 

CTGGGCACAC 37 8 0 

ATTATAGAGG 3 840 

CCCACGTCTT 3 900 

TTTTCAGGAG 3 960 

TATATGTAAT 4020 

AGGAGGGTGG 40 80 

TTTTTGTTTT 4140 
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Seq ID NOi 667 Protein sequence 
Protein Accession #: NP_002812 



40 



45 



50 



55 



60 



65 



70 



75 



80 



I 

MGAARGSPAR 
VHVYWLLDGA 
IKWIEAGPW 
KERNLTLRPA 
EAMPHCQFSA 
CIGQGQRGPP 
VRLPTHGRVY 
SQLEEGKPGY 
CMSSTPAGSI 
GSSLPEWVTD 
TTVYQGHTAL 
RYTCIAGNSC 
GLMFYCKKRC 
KRHSTSDKMH 
LDFRRELEMF 
PLSTKQKVAL 
YHFRQAWVPL 
AGKARLPQPE 



11 

I 

PRRLPLLSVL 
PVQDTERRFA 
LKHPASEAEI 
GPEHSGLYSC 
QPPPSLQWLF 
1ILEATLHLA 
QKGHELVLAN 
LDCLTQATPK 
EAQARVQVLE 
NAGTLHFARV 
LQCEAQGDPK 
NIKHTEAPLY 
KAKRLQKQPE 
FPRSSLQPIT 
GKLNHANWR 
CTQVALGMEH 
RWMSPEAILE 
GCPSKLYRLM 



21 
I 

LLPLLGGTQT 
QGSSLSFAAV 
QPQTQVTLRC 
CAHSAFGQAC 
EDETPITNRS 
EIEDMPLFEP 
IAESDAGVYT 
PTWWYRNQM 
KLKFTPPPQP 
TRDDAGNYTC 
PLIQWKGKDR 
WDKPVPEES 
GEEPEMECLN 
TLGKSEFGEV 
LLGLCREAEP 
LSNNRFVHKD 
GDFSTKSDVW 
QRCWALSPKD 



31 
I 

AIVFIKQPSS 
DRLQDSGTFQ 
HIDGHPRPTY 
SSQNFTLSIA 
RPPHLRRATV 
RVFTAGSEER 
CHAANLAGQR 
LISEDSRFEV 
QQCMEFDKEA 
IASNGPQGQI 
ILDPTKLGPR 
EGPGSPPPYK 
GGPLQNGQPS 
FLAKAQGLEE 
HYMVLEYVDL 
L AARNCLV S A 
AFGVLMWEVF 
RPSFSEIASA 



41 
I 

QDALQGRRAL 
CVARDDVTGE 
QWFRDGTPLS 
DESFARWLA 
FANGSLLLTQ 
VTCLPPKGLP 
RQDVN I TV AT 
FKNGTLRINS 
TVPCSATGRE 
RAHVQLTVAV 
MHIFQNGSLV 
MIQTIGLSVG 
AEIQEEVALT 
GVAETLVLVK 
GDLKQFLRIS 
QRQVKVSALG 
THGEMPHGGQ 
LGDSTVDSKP 



51 
I 

LRCEVEAPGP 
EAR S ANAS FN 
DGQSNHTVSS 
PQDVWARYE 
VRPRNAGIYR 
EPSVWWEHAG 
VPSWLKKPQD 
VEVYDGTWYR 
KPTIKWERAD 
FITFKVEPER 
IHDVAPEDSG 
AAVAYIIAVIi 
SLGSGPAATN 
SLQTKDEQQQ 
KSKDEKLKSQ 
LSKDVYNSEY 
ADDEVLADLQ 



Seq ID NO: 668 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..1389 



85 



1 
1 

ATGGGCTACC 
ACCCTTGTTT 
GTTGTCAACT 
GGGTTTCCTT 
GTTTTATTGA 
AAAACTTTCG 
ATAGCAATGA 
ATCCCAGGAG 
ACAGTTACCT 
TCCCTCATCT 
TCACTGGGTC 
ATTCAAGCGG 
TACAGTTCTC 
GTGATTTCTG 
TTCACCCAAG 
AGATTTTGTT 
GAGGTAATTG 
ACAGTGATGG 
GTT CTAGAAC 
TGTTATCTGA 
ATGCTTCCCA 



11 

1 

AGAGGCAGGA 
CTGAACATGA 
CGATTATAGG 
TGGGAATATT 
TAAAAGGAGG 
GCTTTCCAGG 
TAAGTTACAA 
TTGATCCTGA 
TTACTCTGCC 
CTACAGGTTT 
CACACATACC 
TCGGGGTTAT 
TAGAAGAACC 
TATTTATCTG 
GGGACTTATT 
ATGGTGTCAC 
CCAATGTGTT 
TCATCACTGT 
TCAATGGTGT 
AACTGTCTGA 
TTGGTGCTGT 



21 
I 

GCCTGTCATC 
GTATAAAGAG 
ATCTGGTATA 
GCTTTTATTC 
GGCCCTCTCT 
GTATCTGCTC 
TATAATAGCT 
AAACGTGTTT 
TTTATCCTTG 
AACAACT CTG 
AAAAACAGAA 
GTCTTTTGCA 
CACAGTAGCT 
TATATTCTTT 
TGAAAATTAC 
TGTCATTTTG 
TTTTGGTGGG 
AGCCACGCTT 
GCTCTGTGCA 
AGAACCAAGG 
GGTGATGGTT 



31 
I 

CCGCCGCAGA 
AAAACCTGTC 
ATAGGATTGC 
TGGGTTTCAT 
GGAACAGATA 
CTCTCTGTTC 
GGAGATACTT 
AT TGGTCGCC 
TACCGAAATA 
ATTCTTGGAA 
GACGCTTGGG 
TTTATTTGCC 
AAGTGGTCCC 
GCTACATGTG 
TGCAGAAATG 
ACATACCCTA 
AATCTTTCAT 
GTGTCATTGC 
ACTCCCCTCA 
ACACACTCCG 
TTTGGATTCG 



41 



GAGATTTAGA 
AGTCTGCTGC 
CTTATTCAAT 
ATGTTACGGA 
CCTACCAGTC 
TTCAGTTTTT 
TGAGCAAAGT 
ACTTCATTAT 
TAGCAAAGCT 
TTGTAATGGC 
TATTTGCAAA 
ACCATAACTC 
GCCTTATCCA 
GATACTTGAC 
ATGACCTGGT 
TGGAATGCTT 
CGGTTTTCCA 
TGATTGATTG 
TTTTTATCAT 
ATAAGATTAT 
TCATGGCTAT 



51 
I 

TGACAGAGAA 
TCTTTTTAAT 
GAAGCAAGCT 
CTTTTCCCTT 
TTTGGTCAAT 
GTATCCTTTT 
TTTTCAAAGA 
TGGACTTTCC 
TGGAAAGGTC 
AAGGGCAATT 
GCCCAATGCC 
CTTCTTAGTT 
TATGTCCATC 
ATTTACTGGC 
AACATTTGGA 
TGTGACAAGA 
CATTGTTGTA 
CCTCGGGATA 
TCCATCAGCC 
GTCTTGTGTC 
TACAAATACT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
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CAAGACTGCA CCCATGGGCA GGAAATGTTC TACTGCTTTC CTGACAATTT CTCTCTCACA 
AATACCTCAG AGTCTCATGT TCAGCAGACA ACACAACTTT CTACTTTAAA TATTAGTATC 
TTTCAATGA 



Seq ID NO: 669 Protein sequence 
Protein Accession #: Eos sequence 



1 

1 

MGYQRQEPVI 
GFPLGILLLF 
IAMISYNIIA 
SLISTGLTTL 
YSSLEEPTVA 
RFCYGVTVIL 
VLELNGVLCA 
QDCTHGQEMF 



11 
I 

PPQRDLDDRE 
WVSYVTDFSL 
GDTLSKVFQR 
ILGIVMARAI 
KWSRLIHMSI 
TYPMECFVTR 
TPLIFIIPSA 
YCFPDNFSLT 



21 

1 

TLVSEHEYKE 
VLIiIKGGALS 
IPGVDPENVF 
SLGPHIPKTE 
VISVFICIFF 
EVIANVFFGG 
CYLKDSEEPR 
NTSESHVQQT 



31 
I 

KTCQSAALFN 
GTDTYQSLVN 
IGRHFIIGLS 
DAWVFAKPNA 
ATCGYLTFTG 
NLSSVFHIW 
THSDKIMSCV 
TQLSTLNISI 



41 
I 

WNSIIGSGI 
KTFGFPGYLL 
TVTFTLPLSL 
IQAVGVMSFA 
FTQGDLFENY 
TVMVITVATL 
MLPIGAWMV 
FQ 



51 
I 

IGLPYSMKOA 
LSVLQFLYPF 
YRN I AKLGKV 
FICHHNSFLV 
CRNDDLVTFG 
VSLLIDCLGI 
FGFVMAITNT 



Seq ID NO: 670 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..1284 

1 11 21 31 41 51 

I I 1 I I I 

ATGGGCTACC AGAGGCAGGA GCCTGTCATC CCGCCGCAGA GAGGATTGCC TTATTCAATG 

AAGCAAGCTG GGTTTCCTTT GGGAATATTG CTTTTATTCT GGGTTTCATA TGTTACAGAC 

TTTTCCCTTG TTTTATTGAT AAAAGGAGGG GCCCTCTCTG GAACAGATAC CTACCAGTCT 

TTGGTCAATA AAACTTTCGG CTTTCCAGGG TATCTGCTCC TCTCTGTTCT TCAGTTTTTG 

TATCCTTTTA TAGCAATGAT AAGTTACAAT ATAATAGCTG GAGATACTTT GAGCAAAGTT 

TTTCAAAGAA TCCCAGGAGT TGAT CCTGAA AACGTGTTTA TTGGTCGCCA CTT CATTATT 

GGACTTTCCA CAGTTACCTT TACTCTGCCT TTATCCTTGT ACCGAAATAT AGCAAAGCTT 

GGAAAGGTCT CCCTCATCTC TACAGGTTTA ACAACTCTGA TTCTTGGAAT TGTAATGGCA 

AGGGCAATTT CACTGGGTCC ACACATACCA AAAACAGAAG ACGCTTGGGT ATTTGCAAAG 

CCCAATGCCA TTCAAGCGGT CGGGGTTATG TCTTTTGCAT TTATTTGCCA CCATAACTCC 

TTCTTAGTTT ACAGTTCTCT AGAAGAACCC ACAGTAGCTA AGTGGT CCCG CCTTATCCAT 

ATGTCCATCG TGATTTCTGT ATTTATCTGT ATATTCTTTG CTACATGTGG ATACTTGACA 

TTTACTGGCT TCACCCAAGG GGACTTATTT GAAAATTACT GCAGAAATGA TGACCTGGTA 

ACATTTGGAA GATTTTGTTA TGGTGTCACT GTCATTTTGA CATACCCTAT GGAATGCTTT 

GTGACAAGAG AGGTAATTGC CAATGTGTTT TTTGGTGGGA ATCTTTCATC GGTTTTCCAC 

ATTGTTGTAA CAGTGATGGT CATCACTGTA GCCACGCTTG TGTCATTGCT GATTGATTGC 

CTCGGGATAG TTCTAGAACT CAATGGTGTG CTCTGTGCAA CTCCCCTCAT TTTTATCATT 

CCATCAGCCT GTTATCTGAA ACTGTCTGAA GAACCAAGGA CACACTCCGA TAAGATTATG 

TCTTGTGTCA TGCTTCCCAT TGGTGCTGTG GTGATGGTTT TTGGATTCGT CATGGCTATT 

ACAAATACTC AAGACTGCAC CCATGGGCAG GAAATGTTCT ACTGCTTTCC TGACAATTTC 

TCTCTCACAA ATACCT CAG A GTCTCATGTT CAGCAGACAA CACAACTTTC TACTTTAAAT 

ATTAGTATCT TTCAACTCGA GTAA 



Seq ID NO: 671 Protein sequence 
Protein Accession # : Eos sequence 



1 11 21 31 41 51 

1 I I I 1 I 

MGYQRQEPVI PPQRGLPYSM KQAGFPLGIIi LLFWVSYVTD FSLVLLIKGG ALSGTDTYQS 

LVNKTFGFPG YI>LLSVLQFI> YPFIAMISYN I I AGDTLSKV FQRIPGVDPE NVFIGRHFII 

GLSTVTFTLP LSLYRNIAKL GKVSLISTGL TTLILGIVMA RAISLGPHIP KTEDAWVFAK 

PNAIQAVGVM SFAFICHHNS FLVYS SLEEP TVAKWSRLIH MSIVISVFIC IFFATCGYLT 

FTGFTQGDLF ENYCRNDDLV TFGRFCYGVT VILTYPMECF VTREVIANVF FGGNLSSVFH 

IWTVMVITV ATLVSLLIDC LGIVLELNGV LCATPLIFII PSACYLKLSE EPRTHSDKIM 

SCVMLPIGAV VMVFGFVMAI TNTQDCTHGQ EMFYCFPDNF SLTNTSESHV QQTTQLSTLN 

ISIFQLE 



Seq ID NO: 672 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..1203 



1 11 21 31 41 51 

l l l I l l 

ATGGGCTACC AGAGGCAGGA GCCTGTCATC CCGCCGCAGT TTTCCCTTGT TTTATTGATA 
AAAGGAGGGG CCCTCTCTGG AACAGATACC TACCAGTCTT TGGTCAATAA AACTTTCGGC 
TTTCCAGGGT ATCTGCTCCT CTCTGTTCTT CAGTTTTTGT ATCCTTTTAT AGCAATGATA 
AGTTACAATA TAATAGCTGG AGATACTTTG AGCAAAGTTT TTCAAAGAAT CCCAGGAGTT 
GATCCTGAAA ACGTGTTTAT TGGTCGCCAC TTCATTATTG GACTTTCCAC AGTTACCTTT 
ACTCTGCCTT TATCCTTGTA CCGAAATATA GCAAAGCTTG GAAAGGTCTC CCTCATCTCT 
ACAGGTTTAA CAACTCTGAT TCTTGGAATT GTAATGGCAA GGGCAATTTC ACTGGGT CC A 
CACATACCAA AAACAGAAGA CGCTTGGGTA TTTGCAAAGC CCAATGCCAT TCAAGCGGTC 
GGGGTTATGT CTTTTGCATT TATTTGCCAC CATAACTCCT TCTTAGTTTA CAGTTCTCTA 
GAAGAACCCA CAGTAGCTAA GTGGTCCCGC CTTATCCATA TGTCCATCGT GATTTCTGTA 
TTTATCTGTA TATTCTTTGC TACATGTGGA TACTTGACAT TTACTGGCTT CACCCAAGGG 
GACTTATTTG AAAATTACTG CAGAAATGAT GACCTGGTAA CATTTGGAAG ATTTTGTTAT 
GGTGTCACTG TCATTTTGAC ATACCCTATG GAATGCTTTG TGACAAGAGA GGTAATTGCC 
AATGTGTTTT TTGGTGGGAA TCTTTCATCG GTTTTCCACA TTGTTGTAAC AGTGATGGTC 
ATCACTGTAG CCACGCTTGT GTCATTGCTG ATTGATTGCC TCGGGhTAGT TCTAGAACTC 
AATGGTGTGC TCTGTGCAAC TCCCCTCATT TTTATCATTC CATCAGCCTG TTATCTGAAA 
CTGTCTGAAG AAC CAAGG AC ACACTCCGAT AAGATTATGT CTTGTGTCAT GCTTCCCATT 
GGTGCTGTGG TGATGGTTTT TGGATTCGTC ATGGCTATTA CAAATACTCA AGACTGCACC 
CATGGGCAGG AAATGTTCTA CTGCTTTCCT GACAATTTCT CTCTCACAAA TACCTCAGAG 
TCTCATGTTC AGCAGACAAC ACAACTTTCT ACTTTAAATA TTAGTATCTT TCAACTCGAG 
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TAA 

Seq ID NO: 673 Protein sequence 
Protein Accession # : Eos sequence 

1 11 21 31 41 51 

I I i i l l 

MGYQRQEPVI PPQFSLVLLI KGGALSGTDT YQSLVNKTFG FPGYLLLSVL QFLYPFIAMI 
SYNI I AGDTL SKVFQRIPGV DPENVFIGRH FIIGLSTVTF TLPLSLYRNI AKLGKVSLIS 
TGLTTLILGI VMARAISLGP H I PKTEDAWV FAKPNAIQAV GVMSFAFICH HNSFLVYSSL 
EEPTVAKWSR LIHMSIVISV FICIFFATCG YLTFTGFTQG DLFENYCRND DLVTFGRFCY 
GVTVILTYPM ECFVTREVIA NVFFGGNLSS VFHIWTVMV ITVATLVSLL IDCLGIVLEL 
NGVLCATPLI FIIPSACYLK LSEEPRTHSD KIMSCVMLPI GAWMVFGFV MAITNTQDCT 
HGQEMFYCFP DNFSLTNTSE SHVQQTTQLS TLNTSIFQLE 

Seq ID NO: 674 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..1140 

1 11 21 31 41 51 

I I I i I I 

ATGGGCTACC AGAGGCAGGA GCCTGTCATC CCGCCGCAGG TCAATAAAAC TTTCGGCTTT 

CCAGGGTATC TGCTCCTCTC TGTTCTTCAG TTTTTGTATC CTTTTATAGC AATGATAAGT 

TACAATATAA TAGCTGGAGA TACTTTGAGC AAAGTTTTTC AAAGAATCCC AGGAGTTGAT 

CCTGAAAACG TGTTTATTGG TCGCCACTTC ATTATTGGAC TTTCCACAGT TACCTTTACT 

CTGCCTTTAT CCTTGTACCG AAATATAGCA AAGCTTGGAA AGGTCTCCCT CATCTCTACA 

GGTTTAACAA CTCTGATTCT TGGAATTGTA ATGGCAAGGG CAATTT C ACT GGGTCCACAC 

ATACCAAAAA CAGAAGACGC TTGGGTATTT GCAAAGCCCA ATGCCATTCA AGCGGTCGGG 

GTTATGTCTT TTGCATTTAT TTGCCACCAT AACTCCTTCT TAGTTTACAG TTCTCTAGAA 

GAACCCACAG TAGCTAAGTG GTCCCGCCTT ATCCATATGT CCATCGTGAT TTCTGTATTT 

ATCTGTATAT TCTTTGCTAC ATGTGGATAC TTGACATTTA CTGGCTTCAC CCAAGGGGAC 

TTATTTGAAA AT TACTGCAG AAATGATGAC CTGGTAACAT TTGGAAGATT TTGTTATGGT 

GTCACTGTCA TTTTGACATA CCCTATGGAA TGCTTTGTGA CAAGAGAGGT AATTGCCAAT 

GTGTTTTTTG GTGGG AATCT TTCATCGGTT TTCCACATTG TTGTAACAGT GATGGT CATC 

ACTGTAGCCA CGCTTGTGTC ATTGCTGATT GATTGCCTCG GGATAGTTCT AGAACTCAAT 

GGTGTGCTCT GTGCAACTCC CCTCATTTTT ATCATTCCAT CAGCCTGTTA TCTGAAACTG 

TCTGAAGAAC CAAGGACACA CTCCGATAAG ATTATGTCTT GTGTCATGCT TCCCATTGGT 

GCTGTGGTGA TGGTTTTTGG ATTCGTCATG GCTATTACAA ATACTCAAGA CTGCACCCAT 

GGGCAGGAAA TGTTCTACTG CTTTCCTGAC AATTTCTCTC TCACAAATAC CTCAGAGTCT 

CATGTT CAGC AGACAACACA ACTTTCTACT TTAAATATTA GTATCTTTCA ACTCGAGTAA 

Seq ID NO: 675 Protein sequence 
Protein Accession #: Eos sequence 

1 11 21 31 41 51 

I I I I I 1 

MGYQRQEPVI PPQVNKTFGF PGYLLLSVLQ FLYPFIAMIS YNIIAGDTLS KVFQRIPGVD 

PENVFIGRHF I IGLSTVTFT LPLSLYRNIA KLGKVSLIST GLTTLILGIV MARA I SLGPH 

IPKTEDAWVF AKPNAIQAVG VMSFAFI CHH NSFLVYSSLE EPTVAKWSRL IHMSIVISVF 

ICIFFATCGY LTFTGFTQGD LFENYCRNDD LVTFGRFCYG VTVILTYPME CFVTREVIAN 

VFFGGNLSSV FHIWTVMVI TVATLVSLLI DCLGIVLELN GVLCATPLIF IIPSACYLKL 

SEEPRTHSDK IMSCVMLPIG AWMVFGFVM AITNTQDCTH GQEMFYCFPD NFSLTNTSES 

HVQQTTQLST LNISIFQLE 

Seq ID NO: 676 DNA sequence 

Nucleic Acid Accession #: NM_006853.1 

Coding sequence: 26..874 

1 11 21 31 41 51 

111111 
AGGAATCTGC GCTCGGGTTC CGCAGATGCA GAGGTTGAGG TGGCTGCGGG ACTGGAAGTC 

ATCGGGCAGA GGTCTCACAG CAGCCAAGGA ACCTGGGGCC CGCTCCTCCC CCCTCCAGGC 

CATGAGGATT CTGCAGTTAA TCCTGCTTGC TCTGG CAACA GGGCTTGTAG GGGGAGAGAC 

CAGGAT CAT C AAGGGGTTCG AGTGCAAGCC TCACTCCCAG CCCTGGCAGG CAGCCCTGTT 

CGAGAAGACG CGGCTACTCT GTGGGGCGAC GCTCATCGCC CCCAGATGGC TCCTGACAGC 

AGCCCACTGC CTCAAGCCCC GCTACATAGT TCACCTGGGG CAGCACAACC TCCAGAAGGA 

GGAGGGCTGT GAGCAGACCC GGACAGCCAC TGAGTCCTTC CCCCACCCCG GCTTCAACAA 

CAGCCTCCCC AACAAAGACC ACCGCAATGA CATCATGCTG GTGAAGATGG CATCGCCAGT 

CTCCATCACC TGGGCTGTGC GACCCCTCAC CCTCTCCTCA CGCTGTGTCA CTGCTGGCAC 

CAGCTGCCTC ATTTCCGGCT GGGGCAGCAC GTCCAGCCCC CAGTTACGCC TGCCTCACAC 

CTTGCGATGC GCCAACATCA CCATCATTGA GCACCAGAAG TGTGAGAACG CCTACCCCGG 

CAACATCACA GACACCATGG TGTGTGCCAG CGTGCAGGAA GGGGGCAAGG ACTCCTGCCA 

GGGTGACTCC GGGGGCCCTC TGGTCTGTAA CCAGTCTCTT CAAGGCATTA TCTCCTGGGG 

CCAGGATCCG TGTGCGATCA CCCGAAAGCC TGGTGTCTAC ACGAAAGTCT GCAAATATGT 

GGACTGGATC CAGGAGACGA TGAAGAACAA TTAGACTGGA CCCACCCACC ACAGCCCATC 

ACCCTCCATT TCCACTTGGT GTTTGGTTCC TGTTCACTCT GTTAATAAGA AACCCTAAGC 

CAAGACCCTC TACGAACATT CTTTGGGCCT CCTGGACTAC AGGAGATGCT GTCACTTAAT 

AATCAACCTG GGGTTCGAAA TCAGTGAGAC CTGGATTCAA ATTCTGCCTT GAAATATTGT 

GACTCTGGGA ATGACAACAC CTGGTTTGTT CTCTGTTGTA TCCCCAGCCC CAAAGACAGC 

TCCTGGCCAT ATATCAAGGT TTCAATAAAT ATTTGCTAAA TGAGTG 

Seq ID NO: 677 Protein sequence 
Protein Accession #: NP_006844.1 

1 11 21 31 41 51 

1 I I I I I 

MRILQLILLA LATGLVGGET RIIKGFECKP HSQPWQAALF EKTRLLCGAT LIAPRWLLTA 
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AHCLKPRY IV HLGQHNLQKE EGCEQTRTAT ESFPHPGFNN SLPNKDHRND IMLVKMASPV 
SITWAVRPLT LSSRCVTAGT SCLISGWGST SSPQLRLPHT LRCANITIIE HQKCENAYPG 
NITDTMVCAS VQEGGKDSCQ GDSGGPLVCN QSLQGIISWG QDPCAITRKP GVYTKVCKYV 
DWIQETMKNN 

Seq ID NO: 678 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 1..933 



120 
180 
240 



1 
I 

ATGTGCAGCA 

TTCGACAAGA 

TTCCCCTGTG 

GACTGTCCCG 

GCCCGCTACC 

AATAACTGTC 

GGGCAGGTGT 

ATCAT CGGCA 

CACCAGCGGA 

CTGCTGTCCC 

AATAATGGCA 

CCACCCTCCT 

CCGCCCTACT 

CGGTCCGGGA 

GACACCAGCC 

TCTGAGCCGA 



11 
I 

ATGGACGGTG 

GTGATGAGAA 

CCAGCGGCAT 

ATGGCAGCGA 

ACTGCAAGAA 

AAGACAACAG 

TTGTGACTTC 

GCTCCGTCAT 

AGCGGAACAA 

GCCTGGTGGT 

TCCAGTATGT 

ACTCCGAGGC 

CTTCTGACAC 

GTGCCAACAG 

ACAGCCCGGG 

GCCAGGGCAC 



21 
I 

CATCCCGGGC 

GGAGTGCCCC 

CCATTGCATC 

TGAAGAGAAC 

CGGCCTCTGT 

TGATGAGGAA 

AG AG AAC CAA 

TTTTGTGCTG 

CCTCATGACG 

CCTGGACCAC 

GGCCAGCCAG 

CTTGCTGGAC 

GGAAT CTCTG 

TGCCAGCTCC 

GCAGCCTGGC 

TGAAGAAGTA 



31 
I 

GCCTGGCAGT 

AAGGCTAAGT 

ATTGGTCGCT 

TGCACAGCAA 

ATTGACAAGA 

AGCTGTGAAA 

CTTGTGTATT 

GTGGTGGCCC 

CTGCCCGTGC 

CCCCACCACT 

GCGGAGCAGA 

CAGAGGCCTG 

AACCAAGCCG 

CAGGCAGCCA 

CCCCAGGAGG 

TAA 



41 
i 

GTGACGGGCT 

CGAAATGTGG 

TCCGGTGCAA 

ACCCTCTGCT 

GCTTCATCTG 

GTTCTCAAGA 

ACCCCAGCAT 

TGCTGGCACT 

ACCGGCTGCA 

GCAACGT CAC 

ATGCGTCGGA 

CGTGGTATGA 

ACCTGCCCCC 

GCAGCCTCCT 

GCACTGCTGA 



51 

r 

GCCTGACTGC 

CCCGACCTTC 

TGGGTTTGAG 

TTGCTCCACC 

CGATGGACAG 

ACCCGGCAGT 

CACCTATGCC 

GGTCTTGCAC 

GCACCCTGTG 

CTACAACGTC 

AGTAGGCTCC 

CCTTCCTCCA 

CTACCGCTCC 

GAGCGTGGAA 

GCCCAGGGAC 



Seq ID NO: 679 Protein sequence 
Protein Accession #: Eos sequence 



MCSNGRCIPG 
DCPDGSDEEN 
GQVFVTSENQ 
LLSRLWLDH 
PPYSSDTESL 
SEPSQGTEEV 



11 
I 

AWQCDGLPDC 
CTANPLLCST 
LVYYPSITYA 
PHHCNVTYNV 
NQADLPPYRS 



21 

I 

FDKSDEKECP 
ARYHCKNGLC 
IIGSSVIFVL 
NNGIQYVASQ 
RSGSANSASS 



31 



41 



KAKSKCGPTF 
IDKSFICDGQ 
WALXjALVLH 
AEQNASEVGS 
QAASSLLSVE 



FPCASGIHCI 
NNCQDNSDEE 
HQRKRNNLMT 
PPSYSEALLD 
DTSHSPGQPG 



51 
I 

IGRFRCNGFE 
SCESSQEPGS 
LPVHRLQHPV 
QRPAWYDLPP 
PQEGTAEPRD 



Seq ID NO: 680 DNA sequence 
Nucleic Acid Accession #: S78203.1 
Coding sequence: 1..2190 



l 

ATGAATCCTT 
GAGGTACCAC 
AACTATCCAC 
TATGGAATGA 
ACCTCCACAT 
GCAGCCATTG 
TATGTGCTTG 
GTACACACAG 
AAACCCTGTG 
ACTAGATACT 
ATCACACCCA 
TTTGGAGTTC 
ATATACAATA 
TTTGCTATTT 
CTAGACTGGG 
AGGGTACTAT 
TCACGATGGA 
CCGGACCAGA 
TTTGTCATTT 
GCTGTTGGTA 
ATAAATGAAA 
CTGGCAGATG 
GAGTCCATCA 
AGCCAGGATT 
GTGCAGGAGA 
ATGATGGTAA 
AACACTTTGC 
GAAGACT AT G 
TGTAGAACAG 
TATCTGTTTG 
ATTCCAGCCA 
GGGGAGGTCA 
ATGAAATCTG 
CTTGTTGTGG 
CTCCTGCTGG 
ACAGAGGATA 
AAACTAGAGA 



11 



21 



t . I 
TCCAGAAAAA 

CTCGACCACC 

TGAGCATTGC 

AAGCTGTGCT 

CTATATACCA 

CTGACTCGTG 

GCCATGTGAT 

TCCTATCATT 

TGGCAGCTTT 

TCTCAGTCTT 

TGCTGAGAGG 

CAGGACTGCT 

AACCACCCCC 

CCAATCGTTT 

CAGCTGAGAA 

TCCTTTATAT 

CTTTGCAAGC 

TGCAGGTTCT 

ATCGTCTGGT 

TGATCCTAGC 

TGGCCCCAGC 

ATGAGGTGAA 

AATCCTTTCA 

TTCACTTCCA 

AGAACTGGTA 

AGGATACAGA 

ATAAAGATGT 

GTGTGTCTGC 

AAGATAAGAA 

TTATTACTAA 

ACAAAATGTC 

TGTTCTCTGT 

TGCTCCAGGC 

CACAGTTCAG 

TGATCTGCCT 

TGCGGGGTCC 

CCAAGAAGAC 



TGAGTCCAAG 
TAGCCCTCCA 
CTTCATTGTG 
GAT CCTGT AT 
TGCCTTCAGC 
GTTGGGAAAA 
CAAGTCCTTG 
GATCGGCCTG 
TGGTGGAGAC 
CTACCTGTCC 
AGATGTGCAA 
CATGGTAATT 
TGAAGGAAAC 
CAAGAACCGT 
AT AT CCAAAG 
CCCATTGCCC 
CAT CAGGATG 
AAATCCCTTT 
CTCCAAGTGT 
GTGCCTGGCA 
CCAGTCAGGT 
GGTGACAGTG 
GAAAACACCA 
CCTGAAATAT 
CAGTCTTGTC 
AAGCAAAACA 
CAACATCTCC 
TTATAGAACT 
CTTTTCTCTG 
TAACACCAAT 
CATTGCGTGG 
CACAGGTCTT 
AGCTTGGCTA 
TGGCCTGGTA 
GATCTTCTCC 
AGCAGATAAG 
AAAACT CTGA 



31 
I 

GAAACTCTTT 
AAG AAG C CAT 
GTGAATGAAT 
TTCCTGTATT 
AGCCTCTGTT 
TTCAAGACAA 
GGTGCCTTAC 
AGTCTAATAG 
CAGTTTGAAG 
ATCAATGCAG 
TGTTTTGGAG 
GCACTTGTTG 
ATAGTGGCTC 
TCTGGAGACA 
CAGCTCATTA 
ATGTTCTGGG 
AATAGGAATT 
CTGGTTCTTA 
GGAATTAACT 
TTTGCAGTTG 
CCCCAGGAGG 
GTGGGAAATG 
CACTATTCCA 
CACAATTTGT 
ATTCGTGAAG 
ACCAATGGGA 
CTGAGTACAG 
GTGCAAAGAG 
AATTTGGGTC 
CAGGGTCTTC 
CAGCTACCAC 
GAGTTTTCTT 
TTGACAATTG 
CAGTGGGCCG 
ATCATGGGCT 
CACATTCCTC 



41 51 

I 

TTTCACCTGT 
CTCCGACAAT 
TCTGCGAGCG 
TCCTGCACTG 
ATTTTACTCC 
TCATCTATCT 
CAATACTGGG 
CTTTGGGGAC 
AAAAACATGC 
GGAGCTTGAT 
AAGACTGCTA 
TGTTTGCAAT 
AAGTTTTCAA 
TTCCAAAGCG 
TGGATGTAAA 
CTCTTTTGGA 
TGGGGTTTTT 
TCTTCATCCC 
TCTCATCACT 
CGGCAGCTGT 
TTTTCCTACA 
AAAACAATTC 
AACTGCACCT 
CTCTCTACAC 
ATGGGAACAG 
TGACAACCGT 
ATACCTCTCT 
GAGAATACCC 
TTCTAGACTT 
AGGCCTGGAA 
AATATG CCCT 
ATT CT CAGG C 
CAGTTGGGAA 
AATTCATTTT 
ACTACTATGT 
ACATCCAGGG 



I 

CTCCATTGAA 
CTGTGGCTCC 
CTTTTCCTAT 
GAATGAAGAT 
CATCCTGGGA 
CTCCTTGGTG 
AGGACAAGTG 
AGGAGGCATC 
AGAGGAACGG 
TTCTACATTT 
TGCATTGGCT 
GGGAAGCAAA 
ATGTATCTGG 
ACAGCACTGG 
GGCACTGACC 
TCAGCAGGGT 
TGTGCTTCAG 
GTTGTTTGAC 
TAGGAAAATG 
AGAGATAAAA 
AGTCTTGAAT 
TCTGTTGATA 
GAAAACAAAA 
TGAG CATTCT 
TATCTCCAGC 
GAGGTTTGTT 
CAATGTTGGT 
TGCAGTGCAC 
TGGTGCAGCA 
GATTGAAGAC 
GGTTACAGCT 
TCCCTCTAGC 
TATCATCGTG 
GTTTTCCTGC 
TCCTGTAAAG 
GAACATGATC 
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Seq ID NO: 681 Protein sequence 
Protein Accession #: AAB34388.1 
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1 11 21 

I I I 

MNPFQKNESK ETLFSPVSIE EVPPRPPSPP 
YGMKAVLILY FLYFLHWNED TSTSIYHAFS 
YVLGHVIKSL GALPILGGQV VHTVLSLIGL 
TR YFSVFYLS INAGSLISTF ITPMLRGDVQ 
IYNKPPPEGN IVAQVFKCIW FAI SNRFKNR 
RVLFLYIPLP MFWALLDQQG SRWTLQAIRM 
FVIYRLVSKC GINFSSLRKM AVGMILACLA 
LADDEVKVTV VGNENNSLLI ESIKSFQKTP 
VQEKNWYSLV IREDGNSISS MMVKDTESKT 
EDYGVSAYRT VQRGEYPAVH CRTEDKNFSL 
IPANKMSIAW QLPQYALVTA GEVMFSVTGL 
LWAQFSGIiV QWAEFILFSC LLLVICLIFS 
KLETKKTKL 

Seq ID NO: 682 DNA sequence 
Nucleic Acid Accession #: NM_016077.1 
Coding sequence: 128..667 

1 11 21 31 41 51 

I l I I I I 

TCGCTTTGTG ATTCTTGATC CGGAACTTTG TCACCCAGGA ACCCCGGAAG AGGTAGCTCA 
CGCGATAGAA ACGTGTTCGC TTGCCCAGAA GAAGGGAAGG CGCGAGTGAG GAAAGGAGGT 
ACTGTAGATG CCCTCCAAAT CCTTGGTTAT GGAATATTTG GCTCATCCCA GTACACTCGG 
CTTGGCTGTT GGAGTTGCTT GTGGCATGTG CCTGGGCTGG AGCCTTCGAG TATGCTTTGG 
GATGCTCCCC AAAAGCAAGA CGAGCAAGAC ACACACAGAT ACTGAAAGTG AAG CAAG CAT 
CTTGGGAGAC AGCGGGGAGT ACAAGATGAT TCTTGTGGTT CGAAATGACT TAAAGATGGG 
AAAAGGGAAA GTGGCTGCCC AGTGCTCTCA TGCTGCTGTT TCAGCCTACA AGCAGATTCA 
AAGAAGAAAT CCTGAAATGC TCAAACAATG GGAATACTGT GGCCAGCCCA AGGTGGTGGT 
CAAAGCTCCT GATGAAGAAA CCCTGATTGC ATTATTGGCC CATGCAAAAA TGCTGGGACT 
GACTGTAAGT TTAATT CAAG ATGCTGGACG TACTCAGATT GCACCAGGCT CTCAAACTGT 
CCTAGGGATT GGGCCAGGAC CAGCAGACCT AATTGACAAA GTCACTGGTC ACCTAAAACT 
TTACTAGGTG GACTTTGATA TGACAACAAC CCCTCCATCA CAAGTGTTTG AAGCCTGTCA 
GATTCTAACA ACAAAAG CTG AATTTCTTCA CCCAACTTAA ATGTTCTTGA GATGAAAATA 
AAACCTATTC CCATGTTCTA AAAAAA 

Seq ID NO: 683 Protein sequence 
Protein Accession #: NP_057161.1 

1 11 21 31 41 51 

l l I l l I 

MPSKSLVMEY LAHPSTLGLA VGVACGMCLG WSLRVCFGML PKSKTSKTHT DTESEASILG 
DSGEYKMILV VRNDLKMGKG KVAAQCSHAA VSAYKQIQRR NPEMLKQWEY CGQPKVWKA 
PDEETLIALL AHAKMLGLTV SLIQDAGRTQ IAPGSQTVLG IGPGPADLID KVTGHLKLY 

Seq ID NO: 684 DNA sequence 

Nucleic Acid Accession #: NM_004864.1 

Coding sequence: 26..952 

1 11 21 31 41 51 

I I I I I I 

CGGAACGAGG GCAACCTGCA CAGCCATGCC CGGGCAAGAA CTCAGGACGG TGAATGGCTC 
TCAGATGCTC CTGGTGTTGC TGGTGCTCTC GTGGCTGCCG CATGGGGGCG CCCTGTCTCT 
GGCCGAGGCG AGCCGCGCAA GTTTCCCGGG ACCCTCAGAG TTGCACTCCG AAGACTCCAG 
ATTCCGAGAG TTGCGGAAAC GCTACGAGGA CCTGCTAACC AGGCTGCGGG CCAACCAGAG 
CTGGGAAGAT TCGAACACCG ACCTCGTCCC GGCCCCTGCA GT CCGGAT AC TCACGCCAGA 
AGTGCGGCTG GGATCCGGCG GCCACCTGCA CCTGCGTATC TCTCGGGCCG CCCTTCCCGA 
GGGGCTCCCC GAGGCCTCCC GCCTTCACCG GGCTCTGTTC CGGCTGTCCC CGACGGCGTC 
AAGGTCGTGG GACGTGACAC GACCGCTGCG GCGTCAGCTC AGCCTTGCAA GACCCCAAGC 
GCCCGCGCTG CACCTGCGAC TGTCGCCGCC GCCGTCGCAG TCGGACCAAC TGCTGGCAGA 
ATCTTCGTCC GCACGGCCCC AGCTGGAGTT GCACTTGCGG CCGCAAGCCG CCAGGGGGCG 
CCGCAGAGCG CGTGCGCGCA ACGGGGACGA CTGTCCGCTC GGGCCCGGGC GTTGCTGCCG 
TCTGCACACG GTCCGCGCGT CGCTGGAAGA CCTGGGCTGG GCCGATTGGG TGCTGTCGCC 
ACGGGAGGTG CAAGTGACCA TGTGCATCGG CGCGTGCCCG AGCCAGTTCC GGGCGGCAAA 
CATGCACGCG CAGATCAAGA CGAGCCTGCA CCGCCTGAAG CCCGACACGG AGCCAGCGCC 
CTGCTGCGTG CCCGCCAGCT ACAATCCCAT GGTGCTCATT CAAAAGACCG ACACCGGGGT 
GTCGCTCCAG ACCTATGATG ACTTGTTAGC CAAAGACTGC CACTGCATAT GAGCAGTCCT 
GGTCCTTCCA CTGTGCACCT GCGCGGGGGA GGCGACCTCA GTTGTCCTGC CCTGTGGAAT 
GGGCTCAAGG TTCCTGAGAC ACCCGATTCC TGCCCAAACA GCTGTATTTA TATAAGTCTG 
TTATTTATTA TTAATTTATT GGGGTGACCT TCTTGGGGAC TCGGGGGCTG GTCTGATGGA 
ACTGTGTATT TATTTAAAAC TCTGGTGATA AAAATAAAGC TGTCTGAACT GTTAAAAAAA 
AAAA 

Seq ID NO: 685 Protein sequence 
Protein Accession #: NP_004855.1 

1 11 21 31 41 

I I I I I 

MPGQELRTVN GSQMLLVLLV LSWLPHGGAL SLAEASRASF PGPSELHSED 

EDLLTRLRAN QSWEDSNTDL VPAPAVRILT PEVRLGSGGH LHLRISRAAL 

HRALtFRLSPT ASRSWDVTRP LRRQLSLARP QAPALHLRLS PPPSQSDQLL 

ELHLRPQAAR GRRRARARNG DDCPLGPGRC CRDHTVRASL EDLGWADWVL 

IGACPSQFRA ANMHAQIKTS LHRLKPDTEP APCCVPASYN PMVLIQKTDT 

LAKDCHCI 

Seq ID NO: 686 DNA sequence 
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! 

KKPSPTICGS 
SLCYFTPILG 
SLIALGTGGI 
CFGEDCYALA 
SGDIPKRQHW 
NRNLGFFVLQ 
FAVAAAVE I K 
HYSKLHLKTK 
TNGMTTVRFV 
NLGLLDFGAA 
EFSYSQAPSS 
IMGYYYVPVK 



41 
I 

NYPLSIAFIV 
AAIADSWLGK 
KPCVAAFGGD 
FGVPGLLMVI 
LDWAAEKYPK 
PDQMQVLNPF 
INEMAPAQSG 
SQDFHFHLKY 
NTLHKDVNIS 
YLFVITNNTN 
MKSVLQAAWL 
TEDMRGPADK 



51 

i 

VNEFCERFSY 
FKTIIYLSLV 
QFEEKHAEER 
ALWFAMGSK 
QLIMDVKALT 
LVLIFIPLFD 
PQEVFLQVLN 
HNLSLYTEHS 
LSTDTSLNVG 
QGLQAWKIED 
LTIAVGNIIV 
HIPHIQGNMI 



51 
I 

SRFRELRKRY 
P EGLPEASRIi 
AESSSARPQL 
SPREVQVTMC 
GVSLQTYDDL 
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Nucleic Acid Accession #: NM__002423.2 
Coding sequence: 48..851 

1 11 21 31 41 51 
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ACCAAATCAA CCATAGGTCC AAGAACAATT GTCTCTGGAC GGCAGCTATG CGACTCACCG 
TGCTGTGTGC TGTGTGCCTG CTGCCTGGCA GCCTGGCCCT GCCGCTGCCT CAGGAGGCGG 
GAGGCATGAG TGAGCTACAG TGGGAACAGG CTCAGGACTA TCTCAAGAGA TTTTATCTCT 
ATGACTCAGA AACAAAAAAT GCCAACAGTT TAGAAGCCAA ACTCAAGGAG ATGCAAAAAT 
10 TCTTTGGCCT ACCTATAACT GGAATGTTAA ACTCCCGCGT CATAGAAATA ATGCAGAAGC 

CCAGATGTGG AGTGCCAGAT GTTGCAGAAT ACTCACTATT TCCAAATAGC CCAAAATGGA 
CTTCCAAAGT GGTCACCTAC AGGATCGTAT CATATACTCG AGACTTACCG CATATTACAG 
TGGATCGATT AGTGTCAAAG GCTTTAAACA TGTGGGGCAA AGAGAT CCCC CTGCATTTCA 
GGAAAGTTGT ATGGGGAACT GCTGACATCA TGATTGGCTT TGCGCGAGGA GCTCATGGGG 
15 ACTCCTACCC ATTTGATGGG CCAGGAAACA CGCTGGCTCA TGCCTTTGCG CCTGGGACAG 

GTCTCGGAGG AGATGCTCAC TTCGATGAGG ATGAACGCTG GACGGATGGT AGCAGTCTAG 
GGATTAACTT CCTGTATGCT GCAACTCATG AACTTGGCCA TTCTTTGGGT ATGGGACATT 
CCTCTGATCC TAATGCAGTG ATGTATCCAA CCTATGGAAA TGGAGATCCC CAAAATTTTA 
AACTTTCCCA GGATGATATT AAAGGCATTC AGAAACTATA TGGAAAGAGA AGTAATTCAA 
20 GAAAGAAATA GAAACTTCAG GCAGAACATC CATTCATTCA TTCATTGGAT TGTATATCAT 

TGTTGCACAA TCAGAATTGA TAAGCACTGT TCCTCCACTC CATTTAGCAA TTATGTCACC 
CTTTTTTATT GCAGTTGGTT TTTGAATGTC TTTCACTCCT TTTATTGGTT AAACTCCTTT 
ATGGTGTGAC TGTGTCTTAT TCCATCTATG AGCTTTGTCA GTGCGCGTAG ATGTCAATAA 
ATGTTACATA CACAAATAAA TAAAATGTTT ATTCCATGGT AAATTTA 



25 



40 



Seq ID NO: 687 Protein sequence 
Protein Accession #: NP_002414.1 



1 11 21 31 41 51 

30 | | i | ) | 

MRLTVLCAVC LLPGSLALPIi PQEAGGMSEL QWEQAQDYLK RFYLYDSETK NANSLEAKLK 

EMQKFFGLPI TGMLNSRVIE IMQKPRCGVP DVAEYSLFPN SPKWTSKWT YRIVSYTRDL 

PHITVDRLVS KALNMWGKE I PLHFRKWWG TADIMIGFAR GAHGDSYPFD GPGNTLAHAF 

APGTGLGGDA HFDEDERWTD GSSLGINFLY AATHELGHSL GMGHSSDPNA VMYPTYGNGD 

35 PQNFKLSQDD IKGIQKLYGK RSNSKKK 



Seq ID NO: 688 DNA sequence 

Nucleic Acid Accession #: NM_005221.3 

Coding sequence: 1..870 



1 11 21 31 41 51 

I I l I I I 

ATGACAGGAG TGTTTGACAG AAGGGTCCCC AGCATCCGAT CCGGCGACTT CCAAGCTCCG 
TTCCAGACGT CCGCAGCTAT GCACCATCCG TCT CAGGAAT CGCCAACTTT GCCCGAGTCT 

45 TCAGCTACCG ATTCTGACTA CTACAGCCCT ACGGGGGGAG CCCCGCACGG CTACTGCTCT 

CCTACCTCGG CTTCCTATGG CAAAGCTCTC AACCCCTACC AGTATCAGTA TCACGGCGTG 
AACGGCTCCG CCGGGAGCTA CCCAGCCAAA GCTTATGCCG ACTATAGCTA CGCTAGCTCC 
TACCACCAGT ACGGCGGCGC CTACAACCGC GTCCCAAGCG CCACCAACCA GCCAGAGAAA 
GAAGTGACCG AGCCCGAGGT GAGAATGGTG AATGGCAAAC CAAAGAAAGT TCGTAAACCC 

50 AGGACTATTT ATTCCAGCTT TCAGCTGGCC G CAT TACAGA GAAGGTTTCA GAAGACTCAG 

TACCTCGCCT TGCCGGAACG CGCCGAGCTG GCCGCCTCGC TGGGATTGAC ACAAACACAG 
GTGAAAATCT GGTTTCAGAA CAAAAGATCC AAGATCAAGA AGATCATGAA AAACGGGGAG 
ATGCCCCCGG AGCACAGTCC CAGCTCCAGC GACCCAATGG CGTGTAACTC GCCGCAGTCT 
CCAGCGGTGT GGGAGCCCCA GGGCTCGTCC CGCTCGCTCA GCCACCACCC TCATGCCCAC 

55 CCTCCGACCT CCAACCAGTC CCCAGCGTCC AGCTACCTGG AGAACTCTGC ATCCTGGTAC 

ACAAGTGCAG CCAGCTCAAT CAATTCCCAC CTGCCGCCGC CGGGCTCCTT ACAGCACCCG 
CTGGCGCTGG CCTCCGGGAC ACTCTATTAG 

Seq ID NO: 689 Protein sequence 
60 Protein Accession #: NP_005212.1 

1 11 21 31 41 51 

I i I i I I 

MTGVFDRRVP SIRSGDFQAP FQTSAAMHHP SQESPTLPES SATDSDYYSP TGGAPHGYCS 

65 PTSASYGKAL NPYQYQYHGV NGSAGSYPAK AYADYSYASS YHQYGGAYNR VPSATNQPEK 

EVTEPEVRMV NGKPKKVRKP RTIYSSFQLA ALQRRFQKTQ YLALPERAEL AASLGLTQTQ 

VKIWFQNKRS KIKKIMKNGE MPPEHSPSSS DPMACNSPQS PAVWEPQGSS RSLSHHPHAH 

PPTSNQSPAS SYLENSASWY TSAASSINSH LPPPGSLQHP LALASGTLY 



WO 02/086443 



PCT/US02/12476 



It is understood that the examples described above in no way serve to limit the true 
scope of this invention, but rather are presented for illustrative purposes. All publications, 
sequences of accession numbers, and patent applications cited in this specification are herein 
incorporated by reference as if each individual publication or patent application were 
specifically and individually indicated to be incorporated by reference. 
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WHAT IS CLAIMED IS: 

1 1. A method of detecting a lung cancer-associated transcript in a cell 

2 from a patient, the method comprising contacting a biological sample from the patient with a 

3 polynucleotide that selectively hybridizes to a sequence at least 80% identical to a sequence 

4 as shown in Tables 1A-16. 

1 2. The method of claim 1, wherein the polynucleotide selectively 

2 hybridizes to a sequence at least 95% identical to a sequence as shown in Tables 1A-16. 

1 3. The method of claim 1, wherein the biological sample is a tissue 

2 sample. 

1 4. The method of claim 1, wherein the biological sample comprises 

2 isolated nucleic acids. 

* 

1 5. The method of claim 4, wherein the nucleic acids are mRNA. 

1 6. The method of claim 4, further comprising the step of amplifying 

2 nucleic acids before the step of contacting the biological sample with the polynucleotide. 

1 7. The method of claim 1, wherein the polynucleotide comprises a 

2 sequence as shown in Tables 1A-16. 

1 8. The method of claim 1, wherein the polynucleotide is labeled. 

1 9. The method of claim 8, wherein the label is a fluorescent label. 

1 10. The method of claim 1, wherein the polynucleotide is immobilized on 

2 a solid surface. 

1 11. The method of claim 1, wherein the patient is undergoing a therapeutic 

2 regimen to treat lung cancer. 

1 12. The method of claim 1, wherein the patient is suspected of having lung 

2 cancer. 

1 13. A method of monitoring the efficacy of a therapeutic treatment of lung 

2 cancer, the method comprising the steps of: 
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3 (i) providing a biological sample from a patient undergoing the therapeutic 

4 treatment; and 

5 (ii) determining the level of a lung cancer-associated transcript in the 

6 biological sample by contacting the biological sample with a polynucleotide that selectively 

7 hybridizes to a sequence at least 80% identical to a sequence as shown in Tables 1A-16, 

8 thereby monitoring the efficacy of the therapy. 

1 14. The method of claim 13, further comprising the step of: (iii) comparing 

2 the level of the lung cancer-associated transcript to a level of the lung cancer-associated 

3 transcript in a biological sample from the patient prior to, or earlier in, the therapeutic 

4 treatment. 

1 15. The method of claim 13, wherein the patient is a human. 

1 16. A method of monitoring the efficacy of a therapeutic treatment of lung 

2 cancer, the method comprising the steps of: 

3 (i) providing a biological sample from a patient undergoing the therapeutic 

4 treatment; and 

5 (ii) determining the level of a lung cancer-associated antibody in the biological 

6 sample by contacting the biological sample with a polypeptide encoded by a polynucleotide 

7 that selectively hybridizes to a sequence at least 80% identical to a sequence as shown in 

8 Tables 1A-16, wherein the polypeptide specifically binds to the lung cancer-associated 

9 antibody, thereby monitoring the efficacy of the therapy. 

1 17. The method of claim 16, further comprising the step of: (iii) comparing 

2 the level of the lung cancer-associated antibody to a level of the lung cancer-associated 

3 antibody in a biological sample from the patient prior to, or earlier in, the therapeutic 

4 treatment. 

1 18. The method of claim 16, wherein the patient is a human. 

1 19. A method of monitoring the efficacy of a therapeutic treatment of lung 

2 cancer, the method comprising the steps of: 

3 (i) providing a biological sample from a patient undergoing the therapeutic 

4 treatment; and 
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5 (ii) determining the level of a lung cancer-associated polypeptide in the 

6 biological sample by contacting the biological sample with an antibody, wherein the antibody 

7 specifically binds to a polypeptide encoded by a polynucleotide that selectively hybridizes to 

8 a sequence at least 80% identical to a sequence as shown in Tables 1A-16, thereby 

9 monitoring the efficacy of the therapy. 

1 20. The method of claim 19, further comprising the step of: (iii) comparing 

2 the level of the lung cancer-associated polypeptide to a level of the lung cancer-associated 

3 polypeptide in a biological sample from the patient prior to, or earlier in, the therapeutic 

4 treatment. 

1 21. The method of claim 19, wherein the patient is a human. 

1 22. An isolated nucleic acid molecule consisting of a polynucleotide 

2 sequence as shown in Tables 1A-16. 

1 23. The nucleic acid molecule of claim 22, which is labeled. 

1 24. The nucleic acid of claim 23, wherein the label is a fluorescent label. 

1 25. An expression vector comprising the nucleic acid of claim 22. 

1 26. A host cell comprising the expression vector of claim 25. 

1 27. An isolated polypeptide which is encoded by a nucleic acid molecule 

2 having polynucleotide sequence as shown in Tables 1A-16. 

1 28. An antibody that specifically binds a polypeptide of claim 27. 

1 29. The antibody of claim 28, further conjugated to an effector component. 

1 30. The antibody of claim 29, wherein the effector component is a 

2 fluorescent label. 

1 31. The antibody of claim 29, wherein the effector component is a 

2 radioisotope or a cytotoxic chemical. 

1 32. The antibody of claim 29, which is an antibody fragment. 
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1 33 . The antibody of claim 29, which is a humanized antibody 

1 34. A method of detecting a lung cancer cell in a biological sample from a 

2 patient, the method comprising contacting the biological sample with an antibody of claim 

3 28. 

1 35. The method of claim 34, wherein the antibody is further conjugated to 

2 an effector component. 

1 36. The method of claim 35, wherein the effector component is a 

2 fluorescent label. 

1 37. A method of detecting antibodies specific to lung cancer in a patient, 

2 the method comprising contacting a biological sample from the patient with a polypeptide 

3 encoded by a nucleic acid that comprises a sequence from Tables 1A-16. 

1 38. A method for identifying a compound that modulates a lung cancer- 

2 associated polypeptide, the method comprising the steps of: 

3 (i) contacting the compound with a lung cancer-associated polypeptide, the 

4 polypeptide encoded by a polynucleotide that selectively hybridizes to a sequence at least 

5 80% identical to a sequence as shown in Tables 1A-16; and 

6 (ii) determining the functional effect of the compound upon the polypeptide. 

1 39. The method of claim 38, wherein the functional effect is a physical 

2 effect. 

1 40. The method of claim 38, wherein the functional effect is a chemical 

2 effect. 

1 41. The method of claim 38, wherein the polypeptide is expressed in a 

2 eukaryotic host cell or cell membrane. 

1 42. The method of claim 38, wherein the functional effect is determined by 

2 measuring ligand binding to the polypeptide. 

1 43. The method of claim 38, wherein the polypeptide is recombinant. 
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1 44. A method of inhibiting proliferation of a lung cancer-associated cell to 

2 treat lung cancer in a patient, the method comprising the step of administering to the subject a 

3 therapeutically effective amount of a compound identified using the method of claim 38. 

1 45. The method of claim 44, wherein the compound is an antibody. 

1 46. The method of claim 45, wherein the patient is a human. 

1 47. A drug screening assay comprising the steps of 

2 (i) administering a test compound to a mammal having lung cancer or a cell 

3 isolated therefrom; 

4 (ii) comparing the level of gene expression of a polynucleotide that selectively 

5 hybridizes to a sequence at least 80% identical to a sequence as shown in Tables 1A-16 in a 

6 treated cell or mammal with the level of gene expression of the polynucleotide in a control 

7 cell or mammal, wherein a test compound that modulates the level of expression of the 

8 polynucleotide is a candidate for the treatment of lung cancer. 

1 48. The assay of claim 47, wherein the control is a mammal with lung 

2 cancer or a cell therefrom that has not been treated with the test compound. 

1 49. The assay of claim 47, wherein the control is a normal cell or mammal. 

1 50. A method for treating a mammal having lung cancer comprising 

2 administering a compound identified by the assay of claim 47. 

1 51. A pharmaceutical composition for treating a mammal having lung 

2 cancer, the composition comprising a compound identified by the assay of claim 47 and a 

3 physiologically acceptable excipient. 
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FIELD OF THE INVENTION 
The invention relates to the identification of nucleic acid and protein expression 
15 profiles and nucleic acids, products, and antibodies thereto that are involved in lung cancer; 
and to the use of such expression profiles and compositions in diagnosis and therapy of lung 
cancer. The invention further relates to methods for identifying and using agents and/or 
targets that inhibit lung cancer or related conditions. 

20 BACKGROUND OF THE INVENTION 

Lung cancer is the second most commonly occurring cancer in the United States and 
is the leading cause of cancer-related death. It is estimated that there are over 160,000 new 
cases of lung cancer in the United States every year. Of those who are diagnosed with lung 
cancer, 86 percent will die within five years. Lung cancer is the most common visceral 

25 cancer in men and accounts for nearly one third of all cancer deaths in both men and women. 
In fact, lung cancer accounts for 7% of all deaths, due to any cause, in both men and women. 

Smoking is the primary cause of lung cancer, with more than 80% of lung cancers 
resulting from smoking. About 400 to 500 separate gaseous substances are present in the 
smoke of a non-filter cigarette. The most noteworthy substances include nitrogen oxides, 

30 hydrogen cyanide, formaldehyde, benzene, and toluene. The particles present in cigarette 
smoke contain at least 3,500 individual compounds such as nicotine, tobacco alkaloids 
(nornicotine, anatabine, anabasine), polycyclic aromatic hydrocarbons (e.g., benzo(a)pyrene, 
B(a)P), naphthalenes, aromatic amines, phenols, and tobacco-specific nitrosamines. 
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Tobacco-specific nitrosamines are formed during tobacco curing and processing, and 
are suspected of causing lung cancer in humans. In rodent studies, regardless of where or 
how it is applied, the tobacco-specific nitrosamine known as NNK produces lung adenomas 
and lung adenocarcinomas. The tobacco-specific nitrosamine known as NNAL also produces 
5 lung adenocarcinomas in rodents. 

Many of the chemicals found in cigarette smoke also affect the nonsmoker inhaling 
"secondhand" or sidestream smoke. Indeed, the smoke inhaled by non-smokers has a 
chemical composition similar to the smoke inhaled by smokers, but, importantly, the 
carcinogenic tobacco-specific nitrosamines are present in higher 
10 concentrations in second hand smoke. For this and other reasons, "passive smoking" is an 
important cause of lung cancer, causing as many as 3,000 lung cancer deaths in nonsmokers 
each year. 

In addition to smoking, other factors thought to be causes of lung cancer include on- 
the-job exposure to carcinogens such as asbestos and uranium, exposure to chemical hazards 
15 such as radon, polycyclic aromatic hydrocarbons, chromium, nickel, and inorganic arsenic, 

genetic factors, and diet. 

Histological classification of various lung cancers defines the types of cancer that 
begin in the lung. See, e.g., Travis, et al. (1999) Histological Typing of Lung and Pleural 
Tumours (International Histological Classification of Tumours, No. 1). Four major cell types 

20 make up more than 88% of all primary lung neoplasms. These are: squamous or epidermoid 
carcinoma, small cell (also called oat cell) carcinoma, adenocarcinoma, and large cell (also 
called large cell anaplastic) carcinoma. The remainder include undifferentiated carcinomas, 
carcinoids, bronchial gland tumors, and other rarer types. The various cell types have 
different natural histories and responses to therapy, and, thus, a correct histologic diagnosis is 

25 the first step of effective treatment. 

Small cell lung cancer (SCLC) accounts for 18-25% of all lung cancers, and occurs 
less frequently than non-small cell lung cancers, and generally spreads to distant organs more 
rapidly than non-small cell lung cancer. In general, at the time of presentation small cell lung 
cancers have already spread beyond the bounds where surgery and curative intent 

30 can be undertaken. However, if identified early enough, these cancers are often responsive to 
chemotherapy and thoracic radiation treatment. 

Non-small cell lung cancers (NSCLC) are the more frequently occurring form of lung 
cancer. They comprise squamous cell carcinoma, adenocarcinoma, and large cell carcinoma 
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and account for more than 75% of all lung cancers. Non-small cell tumors that are localized 
at the time of presentation can sometimes be cured with surgery and/or radiotherapy, but 
usually are not identified until significant metastasis has occurred, which are typically not 
very responsive to surgical, chemotherapy, or radiation treatment. 
5 The screening of asymptomatic persons at high risk for lung cancer has often proven 

ineffective. In general, only 5 to 15 percent of lung cancer patients have their disease 
detected while they are asymptomatic. Of course, early detection and treatment are critical 
factors in the fight against lung cancer. The average survival rate is 49% for those whose 
cancer is detected early, before the cancer has spread from the lung. Lung cancer often 

10 spreads outside of the lung, and it may have spread to the bones or brain by the time it is 
diagnosed. While the prognosis may be better for lung cancers that are detected early, 
because of the lack of effective curative treatments, early detection does not necessarily alter 
the total death rate from lung cancer. 

Thus, methods for diagnosis and prognosis of lung cancer and effective treatment of 

15 lung cancer would be desirable. Accordingly, provided herein are methods that can be used 
in diagnosis and prognosis of lung cancer. Further provided are methods that can be used to 
screen candidate therapeutic agents for the ability to modulate, e.g., treat, lung cancer. 
Additionally, provided herein are molecular targets and compositions for therapeutic 
intervention in lung disease and other metastatic cancers. 

20 

SUMMARY OF THE INVENTION 
The present invention provides nucleotide sequences of genes that are up- and down- 
regulated in lung cancer cells. Such genes are useful for diagnostic purposes, and also as 
targets for screening for therapeutic compounds that modulate lung cancer, such as 

25 antibodies. The methods of detecting nucleic acids of the invention or their encoded proteins 
can be used for a number of purposes. Examples include early detection of lung cancers, 
monitoring and early detection of relapse following treatment of lung cancers, monitoring 
response to therapy of lung cancers, determining prognosis of lung cancers, directing therapy 
of lung cancers, selecting patients for postoperative chemotherapy or radiation therapy, 

30 selecting therapy, determining tumor prognosis, treatment, or response to treatment, and early 
detection of precancerous lesions of the lung. Examples of benign or precancerous lesions 
include: atelectasis, emphysema, bronchitis, chronic obstructive pulmonary disease, fibrosis, 
hypersensitivity pneumonitis (HP), interstitial pulmonary fibrosis (IPF), asthma, and 



3 



WO 02/086443 PCT/US02/12476 

bronchiectasis. Other aspects of the invention will become apparent to the skilled artisan by 
the following description of the invention. 

In one aspect, the present invention provides a method of detecting a lung cancer- 
associated transcript in a cell from a patient, the method comprising contacting a biological 
5 sample from the patient with a polynucleotide that selectively hybridizes to a sequence at 
least 80% identical to a sequence as shown in Tables 1A-16. Alternatively, the sample may 
be contacted with a specific binding reagent, e.g., antibody. 

In one embodiment, the polynucleotide selectively hybridizes to a sequence at least 
95% identical to a sequence as shown in Tables 1A-16. In another embodiment, the 
10 polynucleotide comprises a sequence as shown in Tables 1A-16. 

In one embodiment, the biological sample is a tissue sample, or a body fluid. In 
another embodiment, the biological sample comprises isolated nucleic acids, e.g., mRNA. 

In one embodiment, the polynucleotide is labeled, e.g., with a fluorescent label. In 
one embodiment, the polynucleotide is immobilized on a solid surface. In one embodiment, 
15 the patient is undergoing a therapeutic regimen to treat lung cancer. In another embodiment, 
the patient is suspected of having lung cancer. In one embodiment, the patient is a primate, 
e.g., a human. 

In one embodiment, the method further comprises the step of amplifying nucleic acids 
before the step of contacting the biological sample with the polynucleotide. 

20 In another aspect, the present invention provides a method of monitoring the efficacy 

of a therapeutic treatment of lung cancer, the method comprising the steps of: (i) providing a 
biological sample from a patient undergoing the therapeutic treatment; and (ii) determining 
the level of a lung cancer-associated transcript in the biological sample by contacting the 
biological sample with a polynucleotide that selectively hybridizes to a sequence at least 80% 

25 identical to a sequence as shown in Tables 1A-16, thereby monitoring the efficacy of the 
therapy. Or the sample may be evaluated for protein, e.g., contacting the sample with an 
antibody. 

In one embodiment, the method further comprises the step of: (iii) comparing the 
level of the lung cancer-associated transcript to a level of the lung cancer-associated 
30 transcript in a biological sample from the patient prior to, or earlier in, the therapeutic 
treatment. Or the sample may be evaluated for comparison of protein. 

In another aspect, the present invention provides a method of monitoring the efficacy 
of a therapeutic treatment of lung cancer, the method comprising the steps of: (i) providing a 
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biological sample from a patient undergoing the therapeutic treatment; and (ii) determining 
the level of a lung cancer-associated antibody in the biological sample by contacting the 
biological sample with a polypeptide encoded by a polynucleotide that selectively hybridizes 
to a sequence at least 80% identical to a sequence as shown in Tables 1A-16, wherein the 
5 polypeptide specifically binds to the lung cancer-associated antibody, thereby monitoring the 
efficacy of the therapy. 

In one embodiment, the method further comprises the step of: (iii) comparing the 
level of the lung cancer-associated antibody to a level of the lung cancer-associated antibody 
in a biological sample from the patient prior to, or earlier in, the therapeutic treatment. 
10 In another aspect, the present invention provides a method of monitoring the efficacy 

of a therapeutic treatment of lung cancer, the method comprising the steps of: (i) providing a 
biological sample from a patient undergoing the therapeutic treatment; and (ii) determining 

> 

the level of a lung cancer-associated polypeptide in the biological sample by contacting the 
biological sample with an antibody, wherein the antibody specifically binds to a polypeptide 

15 encoded by a polynucleotide that selectively hybridizes to a sequence at least 80% identical 
to a sequence as shown in Tables 1A-16, thereby monitoring the efficacy of the therapy. 

In one embodiment, the method further comprises the step of: (iii) comparing the 
level of the lung cancer-associated polypeptide to a level of the lung cancer-associated 
polypeptide in a biological sample from the patient prior to, or earlier in, the therapeutic 

20 treatment. In one aspect, the present invention provides an isolated nucleic acid molecule 
consisting of a polynucleotide sequence as shown in Tables 1A-16. In one embodiment, an 
expression vector or cell comprises the isolated nucleic acid. In one aspect, the present 
invention provides an isolated polypeptide which is encoded by a nucleic acid molecule 
having polynucleotide sequence as shown in Tables 1A-16. 

25 In another aspect, the present invention provides an antibody that specifically binds to 

an isolated polypeptide which is encoded by a nucleic acid molecule having polynucleotide 
sequence as shown in Tables 1A-16. In one embodiment, the antibody is conjugated to an 
effector component, e.g., a fluorescent label, a radioisotope or a cytotoxic chemical. In one 
embodiment, the antibody is an antibody fragment. In another embodiment, the antibody is 

30 humanized. 

In one aspect, the present invention provides a method of detecting lung cancer in a 
patient, the method comprising contacting a biological sample from the patient with an 
antibody or protein as described herein. 
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In another aspect, the present invention provides a method of detecting antibodies 
specific to a lung cancer gene in a patient, the method comprising contacting a biological 
sample from the patient with a polypeptide encoded by a nucleic acid that comprises a sequence 
from Tables 1A-16. 

5 In another aspect, the present invention provides a method for identifying a compound 

that modulates a lung cancer-associated polypeptide, the method comprising the steps of: (i) 
contacting the compound with a lung cancer-associated polypeptide, the polypeptide encoded 
by a polynucleotide that selectively hybridizes to a sequence at least 80% identical to a 
sequence as shown in Tables 1A-16; and (ii) determining the functional effect of the 

1 0 compound upon the polypeptide. 

In one embodiment, the functional effect is a physical effect, an enzymatic effect, or a 
chemical effect. In one embodiment, the polypeptide is expressed in a eukaryotic host cell or 
cell membrane. In another embodiment, the polypeptide is recombinant. In one 
embodiment, the functional effect is determined by measuring ligand binding to the 

15 polypeptide. 

In another aspect, the present invention provides a method of inhibiting proliferation 
or another critical process of a lung cancer-associated cell to treat lung cancer in a patient, the 
method comprising the step of administering to the subject a therapeutically effective amount 
of a compound identified as described herein. In one embodiment, the compound is an 
20 antibody. 

In another aspect, the present invention provides a drug screening assay comprising 
the steps of: (i) administering a test compound to a mammal having lung cancer or a cell 
isolated therefrom; (ii) comparing the level of gene expression of a polynucleotide that 
selectively hybridizes to a sequence at least 80% identical to a sequence as shown in Tables 
25 1A-16 in a treated cell or mammal with the level of gene expression of the polynucleotide in 
a control cell or mammal, wherein a test compound that modulates the level of expression of 
the polynucleotide is a candidate for the treatment of lung cancer. 

In one embodiment, the control is a mammal with lung cancer or a cell therefrom that 
has not been treated with the test compound. In another embodiment, the control is a normal 
30 cell or mammal, or a non-malignant lung disease. 

In another aspect, the present invention provides a method for treating a mammal 
having lung cancer comprising administering a compound identified by the assay described 
herein. 
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In another aspect, the present invention provides a pharmaceutical composition for 
treating a mammal having lung cancer, the composition comprising a compound identified by 
the assay described herein and a physiologically acceptable excipient. 

5 DETAILED DESCRIPTION OF THE INVENTION 

In accordance with the objects outlined above, the present invention provides novel 
methods for diagnosis and treatment of lung disease or cancer, as well as methods for 
screening for compositions which modulate lung cancer. "Treatment, monitoring, detection 
or modulation of lung disease or cancer" includes treatment, monitoring, detection, or 

10 modulation of lung disease in those patients who have lung disease (whether malignant or 

non-malignant, e.g., emphysema, bronchitis, or fibrosis) as well as patients with lung cancers 
in which gene expression from a gene in Tables 1A-16 is increased or decreased, indicating 
that the subject is more likely to have disease. In particular, while these targets are identified 
primarily from lung cancer samples, these same targets are likely to be similarly found in 

15 analyses of other medical conditions. These other conditions may result from similar 
pathological processes which affect similar tissues, e.g., lung cancer, small cell lung 
carcinoma (oat cell carcinoma), non-small cell carcinomas (e.g., squamous cell carcinoma, 
adenocarcinoma, large cell lung carcinoma, carcinoid, granulomatous), fibrosis (idiopathic 
pulmonary fibrosis (IPF), hypersensitivity pneumonitis (HP), interstitial pneumonitis, 

20 nonspecific idiopathic pneumonitis (NSIP)), chronic obstructive pulmonary disease (COPD, 
e.g., emphysema, chronic bronchitis), asthma, bronchiectasis, and esophageal cancer. See, 
e.g., the NCI webpage and USSN 60/347,349 and USSN 60/xxx,xxx (docket LFBR-001-1P, 
filed March 29, 2002), each of which is incorporated herein by reference. The treatment may 
be of lung cancer or related condition itself, or treatment of metastasis. 

25 In particular, identification of markers selectively expressed on these cancers allows 

for use of that expression in diagnostic, prognostic, or therapeutic methods. As such, the 
invention defines various compositions, e.g., nucleic acids, polypeptides, antibodies, and 
small molecule agonists/antagonists, which will be useful to selectively identify those 
markers. For example, therapeutic methods may take the form of protein therapeutics which 

30 use the marker expression for selective localization or modulation of function (for those 
markers which have a causative disease effect), for vaccines, identification of binding 
partners, or antagonism, e.g., using antisense or RNAi. The markers may be useful for 
molecular characterization of subsets of lung diseases, which subsets may actually require 
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very different treatments. Moreover, the markers may also be important in related diseases to 
the specific cancers, e.g., which affect similar tissues in non-malignant diseases, or have 
similar mechanisms of induction/maintenance. Metastatic processes or characteristics may 
also be targeted. Diagnostic and prognostic uses are made available, e.g., to subset related 
but distinct diseases, or to determine treatment strategy. The detection methods may be based 
upon nucleic acid, e.g., PCR or hybridization techniques, or protein, e.g., ELISA, imaging, 
IHC, etc. The diagnosis may be qualitative or quantitative, and may detect increases or 
decreases in expression levels. 

Tables 1A-16 provide unigene cluster identification numbers for the nucleotide 
sequence of genes that exhibit increased or decreased expression in lung cancer samples. The 
tables also provide an exemplar accession number that provides a nucleotide sequence that is 
part of the unigene cluster. In Table 1A, genes marked as "target 1" or "target 2" are 
particularly useful as therapeutic targets. Genes marked as "target 3" are particularly useful 
as diagnostic markers. Genes marked as "chron" are upregulated in chronically diseased lung 
(e.g., emphysema, bronchitis, fibrosis) relative to lung tumors and normal tissue. In certain 
analyses, the ratio for the "chron" category was determined using the 70th percentile of 
chronically diseased lung samples divided by the 90th percentile of normal lung samples. 
The ratio for the targets was determined using the 70th percentile of lung tumor samples 
divided by the 90th percentile of normal lung samples. 

Definitions 

The term "lung cancer protein" or "lung cancer polynucleotide" or "lung cancer- 
associated transcript" refers to nucleic acid and polypeptide polymorphic variants, alleles, 
mutants, and interspecies homologs that: (1) have a nucleotide sequence that has greater than 
about 60% nucleotide sequence identity, 65%, 70%, 75%, 80%, 85%, 90%, preferably 91%, 
92%, 93%, 94%, 95%, 96%, 97%, 98%, or 99% or greater nucleotide sequence identity, 
preferably over a region of at least about 25, 50, 100, 200, 500, 1000, or 
more nucleotides, to a nucleotide sequence of or associated with a unigene cluster of Tables 
1A-16; (2) bind to antibodies, e.g., polyclonal antibodies, raised against an immunogen 
comprising an amino acid sequence encoded by a nucleotide sequence of or associated with a 
unigene cluster of Tables 1A-16, and conservatively modified variants thereof; (3) 
specifically hybridize under stringent hybridization conditions to a nucleic acid sequence, or 
the complement thereof of Tables 1A-16 and conservatively modified variants thereof; or (4) 
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have an amino acid sequence that has greater than about 60% amino acid sequence identity, 
65%, 70%, 75%, 80%, 85%, 90%, preferably 91%, 92%, 93%, 94%, 95%, 96%, 97%, 98%, 
or 99% or greater amino acid sequence identity, preferably over a region of at 
least about 25, 50, 100, 200, 500, 1000, or more amino acids, to an amino acid sequence 
5 encoded by a nucleotide sequence of or associated with a unigene cluster of Tables 1A-16. A 
polynucleotide or polypeptide sequence is typically from a mammal including, but not 
limited to, primate, e.g., human; rodent, e.g., rat, mouse, hamster; cow, pig, horse, sheep, or 
other mammal. A "lung cancer polypeptide" and a "lung cancer polynucleotide," include 
both naturally occurring or recombinant forms. 

10 A "full length" lung cancer protein or nucleic acid refers to a lung cancer polypeptide 

or polynucleotide sequence, or a variant thereof, that contains the elements normally 
contained in one or more naturally occurring, wild type lung cancer polynucleotide or 
polypeptide sequences. The "full length" may be prior to, or after, various stages of post- 
translational processing or splicing, including alternative splicing. 

15 "Biological sample" as used herein is a sample of biological tissue or fluid that 

contains nucleic acids or polypeptides, e.g., of a lung cancer protein, polynucleotide, or 
transcript. Such samples include, but are not limited to, tissue isolated from primates, e.g., 
humans, or rodents, e.g., mice, and rats. Biological samples may also include sections of 
tissues such as biopsy and autopsy samples, frozen sections taken for histologic purposes, 

20 archival materials, blood, plasma, serum, sputum, stool, tears, mucus, hair, skin, etc. 
Biological samples also include explants and primary and/or transformed cell cultures 
derived from patient tissues. A biological sample is typically obtained from a eukaryotic 
organism, most preferably a mammal such as a primate, e.g., chimpanzee or human; cow; 
dog; cat; a rodent, e.g., guinea pig, rat, mouse; rabbit; or other mammal; or a bird; reptile; 

25 fish. Livestock and domestic animals are of interest. 

"Providing a biological sample" means to obtain a biological sample for use in 
methods described in this invention. Most often, this will be done by removing a sample of 
cells from an animal, but can also be accomplished by using previously isolated cells (e.g., 
isolated by another person, at another time, and/or for another purpose), or by performing the 

30 methods of the invention in vivo. Archival tissues or materials, having treatment or outcome 
history, will be particularly useful. 

The terms "identical" or percent "identity," in the context of two or more nucleic 
acids or polypeptide sequences, refer to two or more sequences or subsequences that are the 
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same or have a specified percentage of amino acid residues or nucleotides that are the same 
(e.g., about 60% identity, preferably 70%, 75%, 80%, 85%, 90%, 91%, 92%, 93%, 94%, 
95%, 96%, 97%, 98%, 99%, or higher identity over a specified region, when compared and 
aligned for maximum correspondence over a comparison window or designated region) as 
5 measured using, e.g., a BLAST or BLAST 2.0 sequence comparison algorithms with default 
parameters described below, or by manual alignment and visual inspection (see, e.g., NCBI 
web site http://www.ncbi.nlm.nih.gov/BLAST/ or the like). Such sequences are then said to 
be "substantially identical." This definition also refers to, or may be applied to, the 
complement of a test sequence. The definition also includes sequences that have deletions 
10 and/or insertions, substitutions, and naturally occurring, e.g., polymorphic or allelic variants, 
and man-made variants. As described below, the preferred algorithms can account for gaps 
and the like. Preferably, identity exists over a region that is at least about 25 amino acids or 
nucleotides in length, or more preferably over a region that is 50-100 amino acids or 
nucleotides in length. 

1 5 For sequence comparison, typically one sequence acts as a reference sequence, to 

which test sequences are compared. When using a sequence comparison algorithm, test and 
reference sequences are entered into a computer, subsequence coordinates are designated, if 
necessary, and sequence algorithm program parameters are designated. Preferably, default 
program parameters can be used, or alternative parameters can be designated. The sequence 

20 comparison algorithm then calculates the percent sequence identities for the test sequences 
relative to the reference sequence, based on the program parameters. 

A "comparison window", as used herein, includes reference to a segment of 
contiguous positions selected from the group consisting typically of from 20 to 600, usually 
about 50 to about 200, more usually about 100 to about 150 in which a sequence may be 

25 compared to a reference sequence of the same number of contiguous positions after the two 
sequences are optimally aligned. Methods of alignment of sequences for comparison are 
well-known in the art. Optimal alignment of sequences for comparison can be conducted, 
e.g., by the local homology algorithm of Smith and Waterman (1981) Adv. Appl. Math. 
2:482, by the homology alignment algorithm of Needleman and Wunsch (1970) J. Mol. Biol. 

30 48:443, by the search for similarity method of Pearson and Lipman (1988) Proc. Nat'l. Acad. 
Sci. USA 85:2444, by computerized implementations of these algorithms (GAP, BESTFIT, 
FASTA, and TFASTA in the Wisconsin Genetics Software Package, Genetics Computer 
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Group, 575 Science Dr., Madison, WI), or by manual alignment and visual inspection (see, 
e.g., Ausubel, et al. (eds. 1995 and supplements) Current Protocols in Molecular Biology). 

Preferred examples of algorithms that are suitable for determining percent sequence 
identity and sequence similarity include the BLAST and BLAST 2.0 algorithms, which are 
5 described in Altschul, et al. (1997) Nuc. Acids Res. 25:3389-3402 and Altschul, et al. (1990) 
J. Mol. Biol. 215:403-410. BLAST and BLAST 2.0 are used, with the parameters described 
herein, to determine percent sequence identity for the nucleic acids and proteins of the 
invention. Software for performing BLAST analyses is publicly available through the 
National Center for Biotechnology Information (http://www.ncbi.nlm.nih.gov/). This 

1 0 algorithm involves first identifying high scoring sequence pairs (HSPs) by identifying short 
words of length W in the query sequence, which either match or satisfy some positive-valued 
threshold score T when aligned with a word of the same length in a database sequence. T is 
referred to as the neighborhood word score threshold (Altschul, et al., supra). These initial 
neighborhood word hits act as seeds for initiating searches to find longer HSPs containing 

1 5 them. The word hits are extended in both directions along each sequence for as far as the 
cumulative alignment score can be increased. Cumulative scores are calculated using, e.g., 
for nucleotide sequences, the parameters M (reward score for a pair of matching residues; 
always > 0) and N (penalty score for mismatching residues; always < 0). For amino acid 
sequences, a scoring matrix is used to calculate the cumulative score. Extension of the word 

20 hits in each direction are halted when: the cumulative alignment score falls off by the 

quantity X from its maximum achieved value; the cumulative score goes to zero or below, 
due to the accumulation of one or more negative-scoring residue alignments; or the end of 
either sequence is reached. The BLAST algorithm parameters W, T, and X determine the 
sensitivity and speed of the alignment. The BLASTN program (for nucleotide sequences) 

25 uses as defaults a wordlength (W) of 11, an expectation (E) of 10, M=5, N=-4 and a 
comparison of both strands. For amino acid sequences, the BLASTP program uses as 
defaults a wordlength of 3, and expectation (E) of 10, and the BLOSUM62 scoring matrix 
(see Henikoff and Henikoff (1989) Proc. Natl. Acad. Sci. USA 89:10915) alignments (B) of 
50, expectation (E) of 10, M=5, N=-4, and a comparison of both strands. 

30 The BLAST algorithm also performs a statistical analysis of the similarity between 

two sequences (see, e.g., Karlin and Altschul (1993) Proc. Nat'l. Acad. Sci. USA 90:5873- 
5787). One measure of similarity provided by the BLAST algorithm is the smallest sum 
probability (P(N)), which provides an indication of the probability by which a match between 
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two nucleotide or amino acid sequences would occur by chance. For example, a nucleic acid 
is considered similar to a reference sequence if the smallest sum probability in a comparison 
of the test nucleic acid to the reference nucleic acid is less than about 0.2, more preferably 
less than about 0.01, and most preferably less than about 0.001. Log values may be negative 
5 large numbers, e.g., 5, 10, 20, 30, 40, 40, 70, 90, 110, 150, 170, etc. 

An indication that two nucleic acid sequences are substantially identical is that the 
polypeptide encoded by the first nucleic acid is immunologically cross reactive with the 
antibodies raised against the polypeptide encoded by the second nucleic acid. Thus, a 
polypeptide is typically substantially identical to a second polypeptide, e.g., where the two 
10 peptides differ only by conservative substitutions. Another indication that two nucleic acid 
sequences are substantially identical is that the two molecules or their complements hybridize 
to each other under stringent conditions. Yet another indication that two nucleic acid 
sequences are substantially identical is that the same primers can be used to amplify the 
sequences. 

15 A "host cell" is a naturally occurring cell or a transformed cell that contains an 

expression vector and supports the replication or expression of the expression vector. Host 
cells may be cultured cells, explants, cells in vivo, and the like. Host cells may be 
prokaryotic cells such as E. coli, or eukaryotic cells such as yeast, insect, amphibian, or 
mammalian cells such as CHO, HeLa, and the like (see, e.g., the American Type Culture 

20 Collection catalog or web site, www.atcc.org). 

The terms "isolated," "purified," or "biologically pure" refer to material that is 
substantially or essentially free from components that normally accompany it as found in its 
native state. Purity and homogeneity are typically determined using analytical chemistry 
techniques such as polyacrylamide gel electrophoresis or high performance liquid 

25 chromatography. A protein or nucleic acid that is the predominant species present in a 

preparation is substantially purified. In particular, an isolated nucleic acid is separated from 
some open reading frames that naturally flank the gene and encode proteins other than protein 
encoded by the gene. The term "purified" in some embodiments denotes that a nucleic acid 
or protein gives rise to essentially one band in an electrophoretic gel. Preferably, it means 

30 that the nucleic acid or protein is at least about 85% pure, more preferably at least 95% pure, 
and most preferably at least 99% pure. "Purify" or "purification" in other embodiments 
means removing at least one contaminant or component from the composition to be purified. 
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In this sense, purification does not require that the purified compound be homogeneous, e.g., 
100% pure. 

The terms "polypeptide," "peptide" and "protein" are used interchangeably herein to 
refer to a polymer of amino acid residues. The terms apply to amino acid polymers in which 
5 one or more amino acid residue is an artificial chemical mimetic of a corresponding naturally 
occurring amino acid, as well as to naturally occurring amino acid polymers, those containing 
modified residues, and non-naturally occurring amino acid polymers. 

The term "amino acid" refers to naturally occurring and synthetic amino acids, as well 
as amino acid analogs and amino acid mimetics that function similarly to the naturally 

10 occurring amino acids. Naturally occurring amino acids are those encoded by the genetic 
code, as well as those amino acids that are later modified, e.g., hydroxyproline, γ- 
carboxyglutamate, and O-phosphoserine. Amino acid analogs refer to compounds that have 
the same basic chemical structure as a naturally occurring amino acid, e.g., an α carbon that is 
bound to a hydrogen, a carboxyl group, an amino group, and an R group, e.g., homoserine, 

15 norleucine, methionine sulfoxide, methionine methyl sulfonium. Such analogs may have 
modified R groups (e.g., norleucine) or modified peptide backbones, but retain some basic 
chemical structure as a naturally occurring amino acid. Amino acid mimetics refer to 
chemical compounds that have a structure that is different from the general chemical 
structure of an amino acid, but that function similarly to another amino acid. 

20 Amino acids may be referred to herein by either their commonly known three letter 

symbols or by the one-letter symbols recommended by the IUPAC-IUB Biochemical 
Nomenclature Commission. Nucleotides, likewise, may be referred to by their commonly 
accepted single-letter codes. 

"Conservatively modified variants" applies to both amino acid and nucleic acid 

25 sequences. With respect to particular nucleic acid sequences, conservatively modified 

variants refers to those nucleic acids which encode identical or essentially identical amino 
acid sequences, or where the nucleic acid does not encode an amino acid sequence, to 
essentially identical or associated, e.g., naturally contiguous, sequences. Because of the 
degeneracy of the genetic code, a large number of functionally identical nucleic acids encode 

30 most proteins. For instance, the codons GCA, GCC, GCG, and GCU each encode the amino 
acid alanine. Thus, at each position where an alanine is specified by a codon, the codon can 
be altered to another of the corresponding codons described without altering the encoded 
polypeptide. Such nucleic acid variations are "silent variations," which are one species of 

13 
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conservatively modified variations. Every nucleic acid sequence herein which encodes a 
polypeptide also describes silent variations of the nucleic acid. In certain contexts each 
codon in a nucleic acid (except AUG, which is ordinarily the only codon for methionine, and 
TGG, which is ordinarily the only codon for tryptophan) can be modified to yield a 
5 functionally similar molecule. Accordingly, a silent variation of a nucleic acid which 
encodes a polypeptide is implicit in a described sequence with respect to the expression 
product, but not necessarily with respect to actual probe sequences. 

As to amino acid sequences, one of skill will recognize that individual substitutions, 
deletions or additions to a nucleic acid, peptide, polypeptide, or protein sequence which 

1 0 alters, adds or deletes a single amino acid or a small percentage of amino acids in the encoded 
sequence is a "conservatively modified variant" where the alteration results in the substitution 
of an amino acid with a chemically similar amino acid. Conservative substitution tables 
providing functionally similar amino acids are well known in the art. Such conservatively 
modified variants are in addition to and do not exclude polymorphic variants, interspecies 

15 homologs, and alleles of the invention. Typically conservative substitutions include for one 
another: 1) Alanine (A), Glycine (G); 2) Aspartic acid (D), Glutamic acid (E); 3) Asparagine 
(N), Glutamine (Q); 4) Arginine (R), Lysine (K); 5) Isoleucine (I), Leucine (L), Methionine 
(M), Valine (V); 6) Phenylalanine (F), Tyrosine (Y), Tryptophan (W); 7) Serine (S), 
Threonine (T); and 8) Cysteine (C), Methionine (M) (see, e.g., Creighton, Proteins (1984)). 

20 Macromolecular structures such as polypeptide structures can be described in terms of 

various levels of organization. For a general discussion of this organization, see, e.g., 
Alberts, et al. (1994) Molecular Biology of the Cell (3rd ed.) and Cantor and Schimmel (1980) 
Biophysical Chemistry Part I: The Conformation of Biological Macromolecules. "Primary 
structure" refers to the amino acid sequence of a particular peptide. "Secondary structure" 

25 refers to locally ordered, three dimensional structures within a polypeptide. These structures 
are commonly known as domains. Domains are portions of a polypeptide that often form a 
compact unit of the polypeptide and are typically 25 to approximately 500 amino acids long. 
Typical domains are made up of sections of lesser organization such as stretches of β-sheet 
and α-helices. "Tertiary structure" refers to the complete three dimensional structure of a 

30 polypeptide monomer. "Quaternary structure" refers to the three dimensional structure 
formed, usually by the noncovalent association of independent tertiary units. Anisotropic 
terms are also known as energy terms. 
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"Nucleic acid" or "oligonucleotide" or "polynucleotide" or grammatical equivalents 
used herein means at least two nucleotides covalently linked together. Oligonucleotides are 
typically from about 5, 6, 7, 8, 9, 10, 12, 15, 25, 30, 40, 50 or more nucleotides in length, up 
to about 100 nucleotides in length. Nucleic acids and polynucleotides are polymers of any 
5 length, including longer lengths, e.g., 200, 300, 500, 1000, 2000, 3000, 5000, 7000, 10,000, 
etc. A nucleic acid of the present invention will generally contain phosphodiester bonds, 
although in some cases, nucleic acid analogs are included that may have at least one different 
linkage, e.g., phosphoramidate, phosphorothioate, phosphorodithioate, or O- 
methylphosphoroamidite linkages (see Eckstein (1992) Oligonucleotides and Analogues: A 

10 Practical Approach Oxford University Press); and peptide nucleic acid backbones and 
linkages. Other analog nucleic acids include those with positive backbones; non-ionic 
backbones, and non-ribose backbones, including those described in U.S. Patent Nos. 
5,235,033 and 5,034,506, and Chapters 6 and 7, in Sanghvi and Cook, eds. Carbohydrate 
Modifications in Antisense Research. ACS Symposium Series 580. Nucleic acids containing 

15 one or more carbocyclic sugars are also included within one definition of nucleic acids. 

Modifications of the ribose-phosphate backbone may be done for a variety of reasons, e.g., to 
increase the stability and half-life of such molecules in physiological environments or as 
probes on a biochip. Mixtures of naturally occurring nucleic acids and analogs can be made; 
alternatively, mixtures of different nucleic acid analogs, and mixtures of naturally occurring 

20 nucleic acids and analogs may be made. 

Particularly preferred are peptide nucleic acids (PNA) which includes peptide nucleic 
acid analogs. These backbones are substantially non-ionic under neutral conditions, in 
contrast to the highly charged phosphodiester backbone of naturally occurring nucleic acids. 
This results in two advantages. First, the PNA backbone exhibits improved hybridization 

25 kinetics. PNAs have larger changes in the melting temperature (Tm) for mismatched versus 
perfectly matched basepairs. DNA and RNA typically exhibit a 2-4° C drop in Tm for an 
internal mismatch. With the non-ionic PNA backbone, the drop is closer to 7-9° C. 
Similarly, due to their non-ionic nature, hybridization of the bases attached to these 
backbones is relatively insensitive to salt concentration. In addition, PNAs are not degraded 

30 by cellular enzymes, and thus can be more stable. 

The nucleic acids may be single stranded or double stranded, as specified, or contain 
portions of both double stranded or single stranded sequence. As will be appreciated by those 
in the art, the depiction of a single strand also defines the sequence of the complementary 

15 
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strand; thus the sequences described herein also provide the complement of the sequence. 
The nucleic acid may be DNA, both genomic and cDNA, RNA, or a hybrid, where the 
nucleic acid may contain combinations of deoxyribo- and ribo-nucleotides, and combinations 
of bases, including uracil, adenine, thymine, cytosine, guanine, inosine, xanthine, 
5 hypoxanthine, isocytosine, isoguanine, etc. "Transcript" typically refers to a naturally 
occurring RNA, e.g., a pre-mRNA, hnRNA, or mRNA. As used herein, the term 
"nucleoside" includes nucleotides and nucleoside and nucleotide analogs, and modified 
nucleosides such as amino modified nucleosides. In addition, "nucleoside" includes non- 
naturally occurring analog structures. Thus, e.g., the individual units of a peptide nucleic 

10 acid, each containing a base, are referred to herein as a nucleoside. 

A "label" or a "detectable moiety" is a composition detectable by spectroscopic, 
photochemical, biochemical, immunochemical, physiological, chemical, or other physical 
means. For example, useful labels include 32P, fluorescent dyes, electron-dense reagents, 
enzymes (e.g., as commonly used in an ELISA), biotin, digoxigenin, or haptens and proteins 

15 or other entities which can be made detectable, e.g., by incorporating a radiolabel into the 

peptide or used to detect antibodies specifically reactive with the peptide. The labels may be 
incorporated into the cancer nucleic acids, proteins, and antibodies. Many methods known in 
the art for conjugating the antibody to the label may be employed, including those methods 
described by Hunter, et al. (1962) Nature 144:945; David, et al. (1974) Biochemistry 

20 13:1014-1021; Pain, et al. (1981) J. Immunol. Meth. 40:219-230; and Nygren (1982) J. 
Histochem. and Cytochem. 30:407-412. 

An "effector" or "effector moiety" or "effector component" is a molecule that is 
bound (or linked, or conjugated), either covalently, through a linker or a chemical bond, or 
noncovalently, through ionic, van der Waals, electrostatic, or hydrogen bonds, to an antibody. 

25 The "effector" can be a variety of molecules including, e.g., detection moieties including 

radioactive compounds, fluorescent compounds, an enzyme or substrate, tags such as epitope 
tags, a toxin; activatable moieties, a chemotherapeutic agent; a lipase; an antibiotic; or a 
radioisotope emitting "hard" e.g., beta radiation. 

A "labeled nucleic acid probe or oligonucleotide" is one that is bound, either 

30 covalently, through a linker or a chemical bond, or noncovalently, through ionic, van der 

Waals, electrostatic, or hydrogen bonds to a label such that the presence of the probe may be 
detected by detecting the presence of the label bound to the probe. Alternatively, methods 
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using high affinity interactions may achieve the same results where one of a pair of binding 
partners binds to the other, e.g., biotin, streptavidin. 

As used herein a "nucleic acid probe or oligonucleotide" is a nucleic acid capable of 
binding to a target nucleic acid of complementary sequence through one or more types of 
5 chemical bonds, usually through complementary base pairing, e.g., through hydrogen bond 
formation. As used herein, a probe may include natural (i.e., A, G, C, or T) or modified bases 
(7-deazaguanosine, inosine, etc.). In addition, the bases in a probe may be joined by a 
linkage other than a phosphodiester bond, preferably one that does not functionally interfere 
with hybridization. Thus, e.g., probes may be peptide nucleic acids in which the constituent 

10 bases are joined by peptide bonds rather than phosphodiester linkages. Probes may bind 

target sequences lacking complete complementarity with the probe sequence depending upon 
the stringency of the hybridization conditions. The probes are preferably directly labeled, 
e.g., with isotopes, chromophores, lumiphores, chromogens, or indirectly labeled, e.g., with 
biotin to which a streptavidin complex may later bind. By assaying for the presence or 

15 absence of the probe, one can detect the presence or absence of the select sequence or 

subsequence. Diagnosis or prognosis may be based at the genomic level, or at the level of 
RNA or protein expression. 

The term "recombinant" when used with reference, e.g., to a cell, or nucleic acid, 
protein, or vector, indicates that the cell, nucleic acid, protein or vector, has been modified by 

20 the introduction of a heterologous nucleic acid or protein or the alteration of a native nucleic 
acid or protein, or that the cell is derived from a cell so modified. Thus, e.g., recombinant 
cells express genes that are not found within the native (non-recombinant) form of the cell or 
express native genes that are otherwise abnormally expressed, under expressed or not 
expressed at all. By the term "recombinant nucleic acid" herein is meant nucleic acid, 

25 originally formed in vitro, in general, by the manipulation of nucleic acid, e.g., using 

polymerases and endonucleases, in a form not normally found in nature. In this manner, 
operable linkage of different sequences is achieved. Thus an isolated nucleic acid, in a linear 
form, or an expression vector formed in vitro by ligating DNA molecules that are not 
normally joined, are both considered recombinant for the purposes of this invention. It is 

30 understood that once a recombinant nucleic acid is made and reintroduced into a host cell or 
organism, it will replicate non-recombinantly, i.e., using the in vivo cellular machinery of the 
host cell rather than in vitro manipulations; however, such nucleic acids, once produced 
recombinantly, although subsequently replicated non-recombinantly, are still considered 
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recombinant for the purposes of the invention. Similarly, a "recombinant protein" is a protein 
made using recombinant techniques, i.e., through the expression of a recombinant nucleic 
acid as depicted above. 

The term "heterologous" when used with reference to portions of a nucleic acid 
5 indicates that the nucleic acid comprises two or more subsequences that are not normally 
found in the same relationship to each other in nature. For instance, the nucleic acid is 
typically recombinantly produced, having two or more sequences, e.g., from unrelated genes 
arranged to make a new functional nucleic acid, e.g., a promoter from one source and a 
coding region from another source. Similarly, a heterologous protein will often refer to two 
10 or more subsequences that are not found in the same relationship to each other in nature (e.g., 
a fusion protein). 

A "promoter" is typically an array of nucleic acid control sequences that direct 
transcription of a nucleic acid. As used herein, a promoter includes necessary nucleic acid 
sequences near the start site of transcription, such as, in the case of a polymerase II type 

15 promoter, a TATA element. A promoter also optionally includes distal enhancer or repressor 
elements, which can be located as much as several thousand base pairs from the start site of 
transcription. A "constitutive" promoter is a promoter that is active under most 
environmental and developmental conditions. An "inducible" promoter is a promoter that is 
active under environmental or developmental regulation. The term "operably linked" refers 

20 to a functional linkage between a nucleic acid expression control sequence (such as a 

promoter, or array of transcription factor binding sites) and a second nucleic acid sequence, 
e.g., wherein the expression control sequence directs transcription of the nucleic acid 
corresponding to the second sequence. 

An "expression vector" is a nucleic acid construct, generated recombinantly or 

25 synthetically, with a series of specified nucleic acid elements that permit transcription of a 

particular nucleic acid in a host cell. The expression vector can be part of a plasmid, virus, or 
nucleic acid fragment. Typically, the expression vector includes a nucleic acid to be 
transcribed in operable linkage to a promoter. 

The phrase "selectively (or specifically) hybridizes to" refers to the binding, 

30 duplexing, or hybridizing of a molecule selectively to a particular nucleotide sequence under 
stringent hybridization conditions when that sequence is present in a complex mixture (e.g., 
total cellular or library DNA or RNA). 
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The phrase "stringent hybridization conditions" refers to conditions under which a 
probe will hybridize to its target subsequence, typically in a complex mixture of nucleic 
acids, but to essentially no other sequences. Stringent conditions are sequence-dependent and 
will be different in different circumstances. Longer sequences hybridize specifically at 
5 higher temperatures. An extensive guide to the hybridization of nucleic acids is found in 
"Overview of principles of hybridization and the strategy of nucleic acid assays" in Tijssen 
(1993) Techniques in Biochemistry and Molecular Biology— Hybridization with Nucleic 
Probes (vol. 24) Elsevier. Generally, stringent conditions are selected to be about 5-10° C 
lower than the thermal melting point (Tm) for the specific sequence at a defined ionic strength 

10 and pH. The Tm is the temperature (under defined ionic strength, pH, and nucleic acid concentration) 
at which 50% of the probes complementary to the target hybridize to the target sequence at 
equilibrium (as the target sequences are present in excess, at Tm, 50% of the probes are 
occupied at equilibrium). Stringent conditions will be those in which the salt concentration is 
less than about 1.0 M sodium ion, typically about 0.01 to 1.0 M sodium ion concentration (or 

15 other salts) at pH 7.0 to 8.3 and the temperature is at least about 30° C for short probes (e.g., 
10 to 50 nucleotides) and at least about 60° C for long probes (e.g., greater than 50 
nucleotides). Stringent conditions may also be achieved with the addition of destabilizing 
agents such as formamide. For selective or specific hybridization, a positive signal is 
typically at least two times background, preferably 10 times background hybridization. 

20 Exemplary stringent hybridization conditions are often: 50% formamide, 5x SSC, and 1% 
SDS, incubating at 42° C, or, 5x SSC, 1% SDS, incubating at 65° C, with wash in 0.2x SSC, 
and 0.1% SDS at 65° C. For PCR, a temperature of about 36° C is typical for low stringency 
amplification, although annealing temperatures may vary between about 32° C and 48° C 
depending on primer length. For high stringency PCR amplification, a temperature of about 

25 62° C is typical, although high stringency annealing temperatures can range from about 50° C 
to about 65° C, depending on the primer length and specificity. Typical cycle conditions for 
both high and low stringency amplifications include a denaturation phase of 90° C - 95° C for 
0.5 - 2 min., an annealing phase lasting 0.5 - 2 min., and an extension phase of about 72° C 
for 1 - 2 min. Protocols and guidelines for low and high stringency amplification reactions 

30 are provided, e.g., in Innis, et al. (1990) PCR Protocols, A Guide to Methods and 
Applications. 

Nucleic acids that do not hybridize to each other under stringent conditions are still 
substantially identical if the polypeptides which they encode are substantially identical. This 
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occurs, e.g., when a copy of a nucleic acid is created using the maximum codon degeneracy 
permitted by the genetic code. In such cases, the nucleic acids typically hybridize under 
moderately stringent hybridization conditions. Exemplary "moderately stringent 
hybridization conditions" include a hybridization in a buffer of 40% formamide, 1 M NaCl, 
5 1% SDS at 37° C, and a wash in 1X SSC at 45° C. A positive hybridization is at least twice 
background. Alternative hybridization and wash conditions can be utilized to provide 
conditions of similar stringency. Additional guidelines for determining hybridization 
parameters are provided in numerous references, e.g., Ausubel, et al. (ed.) Current Protocols in 
Molecular Biology Lippincott. 

10 The phrase "functional effects" in the context of assays for testing compounds that 

modulate activity of a lung cancer protein includes the determination of a parameter that is 
indirectly or directly under the influence of the lung cancer protein or nucleic acid, e.g., a 
physiological, enzymatic, functional, physical, or chemical effect, such as the ability to 
decrease lung cancer. It includes ligand binding activity; cell viability, cell growth on soft 

1 5 agar; anchorage dependence; contact inhibition and density limitation of growth; cellular 
proliferation; cellular transformation; growth factor or serum dependence; tumor specific 
marker levels; invasiveness into Matrigel; tumor growth and metastasis in vivo; mRNA and 
protein expression in cells undergoing metastasis, and other characteristics of lung cancer 
cells. "Functional effects" include in vitro, in vivo, and ex vivo activities. 

20 By "determining the functional effect" is meant assaying for a compound that 

increases or decreases a parameter that is indirectly or directly under the influence of a lung 
cancer protein sequence, e.g., physiological, functional, enzymatic, physical, or chemical 
effects. Such functional effects can be measured by many means known to those skilled in 
the art, e.g., changes in spectroscopic characteristics (e.g., fluorescence, absorbance, 

25 refractive index), hydrodynamic (e.g., shape), chromatographic, or solubility properties for 
the protein, measuring inducible markers or transcriptional activation of the lung cancer 
protein; measuring binding activity or binding assays, e.g., binding to antibodies or other 
ligands, and measuring cellular proliferation. Determination of the functional effect of a 
compound on lung cancer can also be performed using lung cancer assays known to those of 

30 skill in the art such as in vitro assays, e.g., cell growth on soft agar; anchorage 

dependence; contact inhibition and density limitation of growth; cellular proliferation; 
cellular transformation; growth factor or serum dependence; tumor specific marker levels; 
invasiveness into Matrigel; tumor growth and metastasis in vivo; mRNA and protein 

20 
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expression in cells undergoing metastasis, and other characteristics of lung cancer cells. The 
functional effects can be evaluated by many means known to those skilled in the art, e.g., 
microscopy for quantitative or qualitative measures of alterations in morphological features, 
measurement of changes in RNA or protein levels for lung cancer-associated sequences, 
5 measurement of RNA stability, identification of downstream or reporter gene expression 
(CAT, luciferase, β-gal, GFP, and the like), e.g., via chemiluminescence, fluorescence, 
colorimetric reactions, antibody binding, inducible markers, and ligand binding assays. 

"Inhibitors", "activators", and "modulators" of lung cancer polynucleotide and 
polypeptide sequences are used to refer to activating, inhibitory, or modulating molecules or 

10 compounds identified using in vitro and in vivo assays of lung cancer polynucleotide and 

polypeptide sequences. Inhibitors are compounds that, e.g., bind to, partially or totally block 
activity, decrease, prevent, delay activation, inactivate, desensitize, or down regulate the 
activity or expression of lung cancer proteins, e.g., antagonists. Antisense or inhibitory 
nucleic acids may seem to inhibit expression and subsequent function of the protein. 

15 "Activators" are compounds that increase, open, activate, facilitate, enhance activation, 
sensitize, agonize, or up regulate lung cancer protein activity. Inhibitors, activators, or 
modulators also include genetically modified versions of lung cancer proteins, e.g., versions 
with altered activity, as well as naturally occurring and synthetic ligands, antagonists, 
agonists, antibodies, small chemical molecules and the like. Such assays for inhibitors and 

20 activators include, e.g., expressing the lung cancer protein in vitro, in cells, or cell 

membranes, applying putative modulator compounds, and then determining the functional 
effects on activity, as described above. Activators and inhibitors of lung cancer can also be 
identified by incubating lung cancer cells with the test compound and determining increases 
or decreases in the expression of 1 or more lung cancer proteins, e.g., 1, 2, 3, 4, 5, 10, 15, 20, 

25 25, 30, 40, 50 or more lung cancer proteins, such as lung cancer proteins encoded by the 
sequences set out in Tables 1A-16. 

Samples or assays comprising lung cancer proteins that are treated with a potential 
activator, inhibitor, or modulator are compared to control samples without the inhibitor, 
activator, or modulator to examine the extent of inhibition. Control samples (untreated with 

30 inhibitors) are assigned a relative protein activity value of 100%. Inhibition of a polypeptide 
is achieved when the activity value relative to the control is about 80%, preferably 50%, more 
preferably 25-0%. Activation of a lung cancer polypeptide is achieved when the activity 
value relative to the control (untreated with activators) is 110%, more preferably 150%, more 
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preferably 200-500% (i.e., two to five fold higher relative to the control), more preferably 
1000-3000% higher. 

The phrase "changes in cell growth" refers to any change in cell growth and 
proliferation characteristics in vitro or in vivo, such as cell viability, formation of foci, 
5 anchorage independence, semi-solid or soft agar growth, changes in contact inhibition and 
density limitation of growth, loss of growth factor or serum requirements, changes in cell 
morphology, gaining or losing immortalization, gaining or losing tumor specific markers, 
ability to form or suppress tumors when injected into suitable animal hosts, and/or 
immortalization of the cell. See, e.g., Freshney (1994) Culture of Animal Cells a Manual of 

10 Basic Technique pp. 231-241 (3rd ed.). 

"Tumor cell" refers to precancerous, cancerous, and normal cells in a tumor. 
"Cancer cells," "transformed" cells, or "transformation" in tissue culture, refers to 
spontaneous or induced phenotypic changes that do not necessarily involve the uptake of new 
genetic material. Although transformation can arise from infection with a transforming virus 

15 and incorporation of new genomic DNA, or uptake of exogenous DNA, it can also arise 

spontaneously or following exposure to a carcinogen, thereby mutating an endogenous gene. 
Transformation is associated with phenotypic changes, such as immortalization of cells, 
aberrant growth control, nonmorphological changes, and/or malignancy (see, Freshney 
(1994) Culture of Animal Cells a Manual of Basic Technique (3rd ed.)). 

20 "Antibody" refers to a polypeptide comprising a framework region from an 

immunoglobulin gene or fragments thereof that specifically binds and recognizes an antigen. 
The recognized immunoglobulin genes include the kappa, lambda, alpha, gamma, delta, 
epsilon, and mu constant region genes, as well as the myriad immunoglobulin variable region 
genes. Light chains are classified as either kappa or lambda. Heavy chains are classified as 

25 gamma, mu, alpha, delta, or epsilon, which in turn define the immunoglobulin classes, IgG, 
IgM, IgA, IgD, and IgE, respectively. Typically, the antigen-binding region of an antibody or 
its functional equivalent will be most critical in specificity and affinity of binding. See Paul, 
Fundamental Immunology . 

An exemplary immunoglobulin (antibody) structural unit comprises a tetramer. Each 

30 tetramer is composed of two identical pairs of polypeptide chains, each pair having one 
"light" (about 25 kD) and one "heavy" chain (about 50-70 kD). The N-terminus of each 
chain defines a variable region of about 100 to 110 or more amino acids primarily responsible 
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for antigen recognition. The terms variable light chain (V L ) and variable heavy chain (V H ) 
refer to these light and heavy chains respectively. 

Antibodies exist, e.g., as intact immunoglobulins or as a number of well-characterized 
fragments produced by digestion with various peptidases. Thus, e.g., pepsin digests an 
5 antibody below the disulfide linkages in the hinge region to produce F(ab)'2, a dimer of Fab 
which itself is a light chain joined to VH-CH1 by a disulfide bond. The F(ab)'2 may be 
reduced under mild conditions to break the disulfide linkage in the hinge region, thereby 
converting the F(ab)'2 dimer into an Fab' monomer. The Fab' monomer is essentially Fab 
with part of the hinge region (see Paul (ed. 1999) Fundamental Immunology (4th ed.)). While 

10 various antibody fragments are defined in terms of the digestion of an intact antibody, one of 
skill will appreciate that such fragments may be synthesized de novo either chemically or by 
using recombinant DNA methodology. Thus, the term antibody, as used herein, also includes 
antibody fragments either produced by the modification of whole antibodies, or those 
synthesized de novo using recombinant DNA methodologies (e.g., single chain Fv) or those 

15 identified using phage display libraries (see, e.g., McCafferty, et al. (1990) Nature 348:552- 
554). 

For preparation of antibodies, e.g., recombinant, monoclonal, or polyclonal 
antibodies, many techniques known in the art can be used (see, e.g., Kohler and Milstein 
(1975) Nature 256:495-497; Kozbor, et al. (1983) Immunology Today 4:72; Cole, et al. 

20 (1985), pp. 77-96 in Monoclonal Antibodies and Cancer Therapy; Coligan (1991 and 

supplements) Current Protocols in Immunology; Harlow and Lane (1988) Antibodies: A 
Laboratory Manual; and Goding (1986) Monoclonal Antibodies: Principles and Practice (2d 
ed.)). Techniques for the production of single chain antibodies (U.S. Patent 4,946,778) can 
be adapted to produce antibodies to polypeptides of this invention. Also, transgenic mice, or 

25 other organisms such as other mammals, may be used to express humanized antibodies. 

Alternatively, phage display technology can be used to identify antibodies and heteromeric 
Fab fragments that specifically bind to selected antigens (see, e.g., McCafferty, et al. (1990) 
Nature 348:552-554; Marks, et al. (1992) Biotechnology 10:779-783). 

A "chimeric antibody" is an antibody molecule in which, e.g., (a) the constant region, 

30 or a portion thereof, is altered, replaced, or exchanged so that the antigen binding site 
(variable region) is linked to a constant region of a different or altered class, effector 
function, and/or species, or an entirely different molecule which confers new properties to the 
chimeric antibody, e.g., an enzyme, toxin, hormone, growth factor, drug, etc.; or (b) the 



23 



WO 02/086443 PCT/US02/12476 

variable region, or a portion thereof, is altered, replaced, or exchanged with a variable region 
having a different or altered antigen specificity. 



Identification of lung cancer-associated sequences 

5 In one aspect, the expression levels of genes are determined in different patient 

samples for which diagnosis information is desired, to provide expression profiles. An 
expression profile of a particular sample is essentially a "fingerprint" of the state of the 
sample; while two states may have any particular gene similarly expressed, the evaluation of 
a number of genes simultaneously allows the generation of a gene expression profile that is 

10 characteristic of the state of the cell. That is, normal tissue may be distinguished from 
cancerous or metastatic cancerous tissue, or metastatic cancerous tissue can be compared 
with tissue from surviving cancer patients. By comparing expression profiles of tissue in 
known different lung cancer states, information regarding which genes are important 
(including both up- and down-regulation of genes) in each of these states is obtained. 

15 Molecular profiling may distinguish subtypes of a currently collective disease designation, 
e.g., different forms of lung cancer (chronic disease, adenocarcinoma, etc.). 

The identification of sequences that are differentially expressed in lung cancer versus 
non-lung cancer tissue allows the use of this information in a number of ways. For example, 
a particular treatment regime may be evaluated: does a chemotherapeutic drug act to down- 

20 regulate lung cancer, and thus tumor growth or recurrence, in a particular patient. 

Alternatively, a treatment step may induce other markers which may be used as targets to 
destroy tumor cells. Similarly, diagnosis and treatment outcomes may be done or confirmed 
by comparing patient samples with the known expression profiles. Malignant disease may be 
compared to non-malignant conditions. Metastatic tissue can also be analyzed to determine 

25 the stage of lung cancer in the tissue, or origin of primary tumor, e.g., metastasis from a 

remote primary site. Furthermore, these gene expression profiles (or individual genes) allow 
screening of drug candidates with an eye to mimicking or altering a particular expression 
profile; e.g., screening can be done for drugs that suppress the lung cancer expression profile. 
This may be done by making biochips comprising sets of the important lung cancer genes, 

30 which can then be used in these screens. PCR methods may be applied with selected primer 
pairs, and analysis may be of RNA or of genomic sequences. These methods can also be 
done on the protein basis; that is, protein expression levels of the lung cancer proteins can be 
evaluated for diagnostic purposes or to screen candidate agents. In addition, the lung cancer 
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nucleic acid sequences can be administered for gene therapy purposes, including the 
administration of antisense nucleic acids, or the lung cancer proteins (including antibodies 
and other modulators thereof) administered as therapeutic drugs or as protein or DNA 
vaccines. 

5 Thus the present invention provides nucleic acid and protein sequences that are 

differentially expressed in lung cancer relative to normal tissues and/or non-malignant lung 
disease, or in different types of lung disease, herein termed "lung cancer sequences." As 
outlined below, lung cancer sequences include those that are up-regulated (i.e., expressed at a 
higher level) in lung cancer, as well as those that are down-regulated (i.e., expressed at a 

10 lower level). In a preferred embodiment, the lung cancer sequences are from humans; 
however, as will be appreciated by those in the art, lung cancer sequences from other 
organisms may be useful in animal models of disease and drug evaluation; thus, other lung 
cancer sequences are provided, from vertebrates, including mammals, including rodents (rats, 
mice, hamsters, guinea pigs, etc.), primates, farm animals (including sheep, goats, pigs, cows, 

1 5 horses, etc.) and pets (dogs, cats, etc.). Lung cancer sequences from other organisms may be 
obtained using the techniques outlined below. 

Lung cancer sequences can include both nucleic acid and amino acid sequences. As 
will be appreciated by those in the art and is more fully outlined below, lung cancer nucleic 
acid sequences are useful in a variety of applications, including diagnostic applications, 

20 which will detect naturally occurring nucleic acids, as well as screening applications; e.g., 
biochips comprising nucleic acid probes or PCR microtiter plates with selected probes to the 
lung cancer sequences can be generated. 

A lung cancer sequence can be initially identified by substantial nucleic acid and/or 
amino acid sequence homology to the lung cancer sequences outlined herein. Such 

25 homology can be based upon the overall nucleic acid or amino acid sequence, and is 

generally determined as outlined below, e.g., using homology programs or hybridization 
conditions. 

For identifying lung cancer-associated sequences, the lung cancer screen typically 
includes comparing genes identified in different tissues, e.g., normal and cancerous tissues, 
30 cancer and non-malignant conditions, non-malignant conditions and normal tissues, or tumor 
tissue samples from patients who have metastatic disease vs. non metastatic tissue. Other 
suitable tissue comparisons include comparing lung cancer samples with metastatic cancer 
samples from other cancers, such as, breast, other gastrointestinal cancers, prostate, ovarian, 
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etc. Samples of, non metastatic disease tissue and tissue undergoing metastasis are applied to 
biochips comprising nucleic acid probes. The samples are first microdissected, if applicable, 
and treated as is known in the art for the preparation of mRNA. Suitable biochips are 
commercially available, e.g., from Affymetrix, Santa Clara, CA. Gene expression profiles as 
5 described herein are generated and the data analyzed. 

In one embodiment, the genes showing changes in expression as between normal and 
disease states are compared to genes expressed in other normal tissues, preferably normal 
lung, but also including, and not limited to colon, heart, brain, liver, breast, kidney, muscle, 
prostate, small intestine, large intestine, spleen, bone, and/or placenta. In a preferred 
1 0 embodiment, those genes identified during the lung cancer screen that are expressed in 
significant amounts in other tissues (e.g., essential organs) are removed from the profile, 
although in some embodiments, this is not necessary (e.g., where organs may be dispensable 
at a later stage of life). That is, when screening for drugs, it is usually preferable that the 
target expression be disease specific, to minimize possible side effects on other organs. 
15 In a preferred embodiment, lung cancer sequences are those that are up-regulated in 

lung cancer; that is, the expression of these genes is higher in cancerous tissue than in normal 
lung or other tissue. "Up-regulation" as used herein means, when the ratio is presented as a 
number greater than one, that the ratio is greater than one, preferably 1.5 or greater, more 
preferably 2.0 or greater. Another embodiment is directed to sequences up-regulated in non- 
20 malignant conditions relative to normal. Unigene cluster identification numbers and 

accession numbers herein are for the GenBank sequence database and the sequences of the 
accession numbers are hereby expressly incorporated by reference. GenBank is known in the 
art, see, e.g., Benson, DA, et al (1998) Nucleic Acids Research 26:1-7 and 
http://www.ncbi.nlm.nih.gov/. Sequences are also available in other databases, e.g., 
25 European Molecular Biology Laboratory (EMBL) and DNA Database of Japan (DDBJ). 
Another embodiment is directed to sequences up-regulated in non-malignant conditions 
relative to normal. In some situations, the sequences may be derived from assembly of 
available sequences or be predicted from genomic DNA using exon prediction algorithms, 
such as FGENESH (Salamov and Solovyev (2000) Genome Res. 10:516-522). In other 
30 situations, sequences have been derived from cloning and sequencing of isolated nucleic 
acids. 

In another preferred embodiment, lung cancer sequences are those that are down- 
regulated in the lung cancer; that is, the expression of these genes is lower in cancerous tissue 
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or normal lung or other tissue. "Down-regulation" as used herein means, when the ratio is 
presented as a number greater than one, that the ratio is greater than one, preferably 1.5 or 
greater, more preferably 2.0 or greater, or, when the ratio is presented as a number less than 
one, that the ratio is less than one, preferably 0.5 or less, more preferably 0.25 or less. 

5 

Informatics 

The ability to identify genes that are over or under expressed in lung cancer can 
additionally provide high-resolution, high-sensitivity datasets which can be used in the areas 
of diagnostics, therapeutics, drug development, pharmacogenetics, protein structure, 

10 biosensor development, and other related areas. For example, the expression profiles can be 
used in diagnostic or prognostic evaluation of patients with lung cancer. Or as another 
example, subcellular toxicological information can be generated to better direct drug structure 
and activity correlation (see Anderson (1998) Pharmaceutical Proteomics: Targets, 
Mechanism, and Function, paper presented at the IBC Proteomics conference, Coronado, CA 

15 (June 11-12, 1998)). Subcellular toxicological information can also be utilized in a biological 
sensor device to predict the likely toxicological effect of chemical exposures and likely 
tolerable exposure thresholds (see U.S. Patent No. 5,811,231). Similar advantages accrue 
from datasets relevant to other biomolecules and bioactive agents (e.g., nucleic acids, 
saccharides, lipids, drugs, and the like). 

20 Thus, in another embodiment, the present invention provides a database that includes 

at least one set of assay data. The data contained in the database is acquired, e.g., using array 
analysis either singly or in a library format. The database can be in a form in which data can 
be maintained and transmitted, but is preferably an electronic database. The electronic 
database of the invention can be maintained on any electronic device allowing for the storage 

25 of and access to the database, such as a personal computer, but is preferably distributed on a 
wide area network, such as the World Wide Web. 

The focus of the present section on databases that include peptide sequence data is for 
clarity of illustration only. It will be apparent to those of skill in the art that similar databases 
can be assembled for assay data acquired using an assay of the invention. 

30 The compositions and methods for identifying and/or quantitating the relative and/or 

absolute abundance of a variety of molecular and macromolecular species from a biological 
sample representing lung cancer, i.e., the identification of lung cancer-associated sequences 
described herein, provide an abundance of information, which can be correlated with 
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pathological conditions, predisposition to disease, drug testing, therapeutic monitoring, gene- 
disease causal linkages, identification of correlates of immunity and physiological status, 
among others. Although the data generated from the assays of the invention is suited for 
manual review and analysis, in a preferred embodiment, data processing using high-speed 
5 computers is utilized. 

An array of methods for indexing and retrieving biomolecular information is known 
in the art. For example, U.S. Patents 6,023,659 and 5,966,712 disclose a relational database 
system for storing biomolecular sequence information in a manner that allows sequences to 
be catalogued and searched according to one or more protein function hierarchies. U.S. 

10 Patent 5,953,727 discloses a relational database having sequence records containing 
information in a format that allows a collection of partial-length DNA sequences to be 
catalogued and searched according to association with one or more sequencing projects for 
obtaining full-length sequences from the collection of partial length sequences. U.S. Patent 
5,706,498 discloses a gene database retrieval system for making a retrieval of a gene 

1 5 sequence similar to a sequence data item in a gene database based on the degree of similarity 
between a key sequence and a target sequence. U.S. Patent 5,538,897 discloses a method 
using mass spectroscopy fragmentation patterns of peptides to identify amino acid sequences 
in computer databases by comparison of predicted mass spectra with experimentally-derived 
mass spectra using a closeness-of-fit measure. U.S. Patent 5,926,818 discloses a multi- 

20 dimensional database comprising a functionality for multi-dimensional data analysis 
described as on-line analytical processing (OLAP), which entails the consolidation of 
projected and actual data according to more than one consolidation path or dimension. U.S. 
Patent 5,295,261 reports a hybrid database structure in which the fields of each database 
record are divided into two classes, navigational and informational data, with navigational 

25 fields stored in a hierarchical topological map which can be viewed as a tree structure or as 
the merger of two or more such tree structures. 

See also Mount, et al. (2001) Bioinformatics; Durbin, et al. (eds., 1999) Biological 
Sequence Analysis: Probabilistic Models of Proteins and Nucleic Acids; Baxevanis and 
Ouellette (eds., 1998) Bioinformatics: A Practical Guide to the Analysis of Genes and 

30 Proteins; Rashidi and Buehler (1999) Bioinformatics: Basic Applications in Biological 

Science and Medicine; Setubal, et al. (eds., 1997) Introduction to Computational Molecular 
Biology; Misener and Krawetz (eds., 2000) Bioinformatics: Methods and Protocols; Higgins 
and Taylor (eds., 2000) Bioinformatics: Sequence, Structure, and Databanks: A Practical 
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Approach; Brown (2001) Bioinformatics: A Biologist's Guide to Biocomputing and the 
Internet; Han and Kamber (2000) Data Mining: Concepts and Techniques (2000); and 
Waterman (1995) Introduction to Computational Biology: Maps, Sequences, and Genomes. 
The present invention provides a computer database comprising a computer and 
5 software for storing in computer-retrievable form assay data records cross-tabulated, e.g., 
with data specifying the source of the target-containing sample from which each sequence 
specificity record was obtained. 

In an exemplary embodiment, at least one of the sources of target-containing sample 
is from a control tissue sample known to be free of pathological disorders. In a variation, at 

10 least one of the sources is a known pathological tissue specimen, e.g., a neoplastic lesion or 
another tissue specimen to be analyzed for lung cancer. In another variation, the assay 
records cross-tabulate one or more of the following parameters for each target species in a 
sample: (1) a unique identification code, which can include, e.g., a target molecular structure 
and/or characteristic separation coordinate (e.g., electrophoretic coordinates); (2) sample 

15 source; and (3) absolute and/or relative quantity of the target species present in the sample. 

The invention also provides for the storage and retrieval of a collection of target data 
in a computer data storage apparatus, which can include magnetic disks, optical disks, 
magneto-optical disks, DRAM, SRAM, SGRAM, SDRAM, RDRAM, DDR RAM, magnetic 
bubble memory devices, and other data storage devices, including CPU registers and on-CPU 

20 data storage arrays. Typically, the target data records are stored as a bit pattern in an array of 
magnetic domains on a magnetizable medium or as an array of charge states or transistor gate 
states, such as an array of cells in a DRAM device (e.g., each cell comprised of a transistor 
and a charge storage area, which may be on the transistor). In one embodiment, the invention 
provides such storage devices, and computer systems built therewith, comprising a bit pattern 

25 encoding a protein expression fingerprint record comprising unique identifiers for at least 10 
target data records cross-tabulated with target source. 

When the target is a peptide or nucleic acid, the invention preferably provides a 
method for identifying related peptide or nucleic acid sequences, comprising performing a 
computerized comparison between a peptide or nucleic acid sequence assay record stored in 

30 or retrieved from a computer storage device or database and at least one other sequence. The 
comparison can include a sequence analysis or comparison algorithm or computer program 
embodiment thereof (e.g., FASTA, TFASTA, GAP, BESTFIT) and/or the comparison may 
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be of the relative amount of a peptide or nucleic acid sequence in a pool of sequences 
determined from a polypeptide or nucleic acid sample of a specimen. 

The invention also preferably provides a magnetic disk, such as an IBM-compatible 
(DOS, Windows, Windows95/98/2000, Windows NT, OS/2) or other format (e.g., Linux, 
5 SunOS, Solaris, AIX, SCO Unix, VMS, MV, Macintosh, etc.) floppy diskette or hard (fixed, 
Winchester) disk drive, comprising a bit pattern encoding data from an assay of the invention 
in a file format suitable for retrieval and processing in a computerized sequence analysis, 
comparison, or relative quantitation method. 

The invention also provides a network, comprising a plurality of computing devices 

10 linked via a data link, such as an Ethernet cable (coax or 10BaseT), telephone line, ISDN 

line, wireless network, optical fiber, or other suitable signal transmission medium, whereby at 
least one network device (e.g., computer, disk array, etc.) comprises a pattern of magnetic 
domains (e.g., magnetic disk) and/or charge domains (e.g., an array of DRAM cells) 
composing a bit pattern encoding data acquired from an assay of the invention. 

15 The invention also provides a method for transmitting assay data that includes 

generating an electronic signal on an electronic communications device, such as a modem, 
ISDN terminal adapter, DSL, cable modem, ATM switch, or the like, wherein the signal 
includes (in native or encrypted format) a bit pattern encoding data from an assay or a 
database comprising a plurality of assay results obtained by the method of the invention. 

20 In a preferred embodiment, the invention provides a computer system for comparing a 

query target to a database containing an array of data structures, such as an assay result 
obtained by the method of the invention, and ranking database targets based on the degree of 
identity and gap weight to the target data. A central processor is preferably initialized to load 
and execute the computer program for alignment and/or comparison of the assay results. 

25 Data for a query target is entered into the central processor via an I/O device. Execution of 
the computer program results in the central processor retrieving the assay data from the data 
file, which comprises a binary description of an assay result. 

The target data or record and the computer program can be transferred to secondary 
memory, which is typically random access memory (e.g., DRAM, SRAM, SGRAM, or 

30 SDRAM). Targets are ranked according to the degree of correspondence between a selected 
assay characteristic (e.g., binding to a selected affinity moiety) and the same characteristic of 
the query target and results are output via an I/O device. For example, a central processor 
can be a conventional computer (e.g., Intel Pentium, PowerPC, Alpha, PA-8000, SPARC, 
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MIPS 4400, MIPS 10000, VAX, etc.); a program can be a commercial or public domain 
molecular biology software package (e.g., UWGCG Sequence Analysis Software, Darwin); a 
data file can be an optical or magnetic disk, a data server, a memory device (e.g., DRAM, 
SRAM, SGRAM, SDRAM, EPROM, bubble memory, flash memory, etc.); an I/O device can 
5 be a terminal comprising a video display and a keyboard, a modem, an ISDN terminal 

adapter, an Ethernet port, a punched card reader, a magnetic strip reader, or other suitable I/O 
device. 

The invention also preferably provides the use of a computer system, such as that 
described above, which comprises: (1) a computer; (2) a stored bit pattern encoding a 
10 collection of peptide sequence specificity records obtained by the methods of the invention, 
which may be stored in the computer; (3) a comparison target, such as a query target; and (4) 
a program for alignment and comparison, typically with rank-ordering of comparison results 
on the basis of computed similarity values. 

1 5 Characteristics of lung cancer-associated proteins 

Lung cancer proteins of the present invention may be classified as secreted proteins, 
transmembrane proteins or intracellular proteins. In one embodiment, the lung cancer protein 
is an intracellular protein. Intracellular proteins may be found in the cytoplasm and/or in the 
nucleus. Intracellular proteins are involved in all aspects of cellular function and replication 

20 (including, e.g., signaling pathways); aberrant expression of such proteins often results in 
unregulated or dysregulated cellular processes (see, e.g., Alberts (ed. 1994) Molecular 
Biology of the Cell (3d ed.)). For example, many intracellular proteins have enzymatic 
activity such as protein kinase activity, protein phosphatase activity, protease activity, 
nucleotide cyclase activity, polymerase activity and the like. Intracellular proteins also serve 

25 as docking proteins that are involved in organizing complexes of proteins, or targeting 

proteins to various subcellular localizations, and are involved in maintaining the structural 
integrity of organelles. 

An increasingly appreciated concept in characterizing proteins is the presence in the 
proteins of one or more structural motifs for which defined functions have been attributed. In 

30 addition to the highly conserved sequences found in the enzymatic domain of proteins, highly 
conserved sequences have been identified in proteins that are involved in protein-protein 
interaction. For example, Src-homology-2 (SH2) domains bind tyrosine-phosphorylated 
targets in a sequence dependent manner. PTB domains, which are distinct from SH2 
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domains, also bind tyrosine phosphorylated targets. SH3 domains bind to proline-rich 
targets. In addition, PH domains, tetratricopeptide repeats and WD domains to name only a 
few, have been shown to mediate protein-protein interactions. Some of these may also be 
involved in binding to phospholipids or other second messengers. As will be appreciated by 
5 one of ordinary skill in the art, these motifs can be identified on the basis of amino acid 
sequence; thus, an analysis of the sequence of proteins may provide insight into both the 
enzymatic potential of the molecule and/or molecules with which the protein may associate. 
One useful database is Pfam (protein families), which is a large collection of multiple 
sequence alignments and hidden Markov models covering many common protein domains. 
10 Versions are available via the internet from Washington University in St. Louis, the Sanger 
Center in England, and the Karolinska Institute in Sweden (see, e.g., Bateman, et al (2000) 
Nuc. Acids Res. 28:263-266; Sonnhammer, et al. (1997) Proteins 28:405-420; Bateman, et al. 
(1999) Nuc. Acids Res. 27:260-262; and Sonnhammer, et al. (1998) Nuc. Acids Res. 26:320- 
322). 

15 In another embodiment, the lung cancer sequences are transmembrane proteins. 

Transmembrane proteins are molecules that span a phospholipid bilayer of a cell. They may 
have an intracellular domain, an extracellular domain, or both. The intracellular domains of 
such proteins may have a number of functions including those already described for 
intracellular proteins. For example, the intracellular domain may have enzymatic activity 

20 and/or may serve as a binding site for additional proteins. Frequently the intracellular 

domain of transmembrane proteins serves both roles. For example certain receptor tyrosine 
kinases have both protein kinase activity and SH2 domains. In addition, autophosphorylation 
of tyrosines on the receptor molecule itself, creates binding sites for additional SH2 domain 
containing proteins. 

25 Transmembrane proteins may contain from one to many transmembrane domains. 

For example, receptor tyrosine kinases, certain cytokine receptors, receptor guanylyl cyclases 
and receptor serine/threonine protein kinases contain a single transmembrane domain. 
However, various other proteins including channels, pumps, and adenylyl cyclases contain 
numerous transmembrane domains. Many important cell surface receptors such as G protein 

30 coupled receptors (GPCRs) are classified as "seven transmembrane domain" proteins, as they 
contain 7 membrane spanning regions. Characteristics of transmembrane domains include 
approximately 17 consecutive hydrophobic amino acids that may be followed by charged 
amino acids. Therefore, upon analysis of the amino acid sequence of a particular protein, the 

i 
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localization and number of transmembrane domains within the protein may be predicted (see, 
e.g., PSORT web site http://psort.nibb.ac.jp/). 

The extracellular domains of transmembrane proteins are diverse; however, conserved 
motifs are found repeatedly among various extracellular domains. Conserved structure 
5 and/or functions have been ascribed to different extracellular motifs. Many extracellular 

domains are involved in binding to other molecules. In one aspect, extracellular domains are 
found on receptors. Factors that bind the receptor domain include circulating ligands, which 
may be peptides, proteins, or small molecules such as adenosine and the like. For example, 
growth factors such as EGF, FGF, and PDGF are circulating growth factors that bind to their 

10 cognate receptors to initiate a variety of cellular responses. Other factors include cytokines, 
mitogenic factors, hormones, neurotrophic factors and the like. Extracellular domains also 
bind to cell-associated molecules. In this respect, they may mediate cell-cell interactions. 
Cell-associated ligands can be tethered to the cell, e.g., via a glycosylphosphatidylinositol 
(GPI) anchor, or may themselves be transmembrane proteins. Extracellular domains may 

15 also associate with the extracellular matrix and contribute to the maintenance of the cell 
structure. 

Lung cancer proteins that are transmembrane are particularly preferred in the present 
invention as they are readily accessible targets for extracellular immunotherapeutics, as are 
described herein. In addition, as outlined below, transmembrane proteins can be also useful 

20 in imaging modalities. Antibodies may be used to label such readily accessible proteins in 
situ or in histological analysis. Alternatively, antibodies can also label intracellular proteins, 
in which case analytical samples are typically permeabilized to provide access to intracellular 
proteins. In addition, some membrane proteins can be processed to release a soluble protein, 
or to expose a residual fragment. Released soluble proteins may be useful diagnostic 

25 markers; processed residual protein fragments may be useful lung markers of disease. 

It will also be appreciated by those in the art that a transmembrane protein can be 
made soluble by removing transmembrane sequences, e.g., through recombinant methods. 
Furthermore, transmembrane proteins that have been made soluble can be made to be 
secreted through recombinant means by adding an appropriate signal sequence. 

30 In another embodiment, the lung cancer proteins are secreted proteins; the secretion of 

which can be either constitutive or regulated. These proteins may have a signal peptide or 
signal sequence that targets the molecule to the secretory pathway. Secreted proteins are 
involved in numerous physiological events; e.g., if circulating, they often serve to transmit 
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signals to various other cell types. The secreted protein may function in an autocrine manner 
(acting on the cell that secreted the factor), a paracrine manner (acting on cells in close 
proximity to the cell that secreted the factor), an endocrine manner (acting on cells at a 
distance, e.g., secretion into the blood stream), or exocrine (secretion, e.g., through a duct or 
5 to adjacent epithelial surface as sweat glands, sebaceous glands, pancreatic ducts, lacrimal 
glands, mammary glands, wax-producing glands of the ear, etc.). Thus secreted molecules 
often find use in modulating or altering numerous aspects of physiology. Lung cancer 
proteins that are secreted proteins are particularly preferred in the present invention as they 
serve as good targets for diagnostic markers, e.g., for blood, plasma, serum, or stool tests. 
10 Those which are enzymes may be antibody or small molecule targets. Others may be useful 
as vaccine targets, e.g., via CTL mechanisms. 

Use of lung cancer nucleic acids 

As described above, lung cancer sequence is initially identified by substantial nucleic 
15 acid and/or amino acid sequence homology or linkage to the lung cancer sequences outlined 
herein. Such homology can be based upon the overall nucleic acid or amino acid sequence, 
and is generally determined as outlined below, using either homology programs or 
hybridization conditions. Typically, linked sequences on a mRNA are found on the same 
molecule. 

20 The lung cancer nucleic acid sequences of the invention, e.g., the sequences in Tables 

1A-16, can be fragments of larger genes, i.e., they are nucleic acid segments. "Genes" in this 
context includes coding regions, non-coding regions, and mixtures of coding and non-coding 
regions. Accordingly, as will be appreciated by those in the art, using the sequences provided 
herein, extended sequences, in either direction, of the lung cancer genes can be obtained, 

25 using techniques well known in the art for cloning either longer sequences or the full length 
sequences; see Ausubel, et al., supra. Much can be done by informatics and many sequences 
can be clustered to include multiple sequences corresponding to a single gene, e.g., systems 
such as UniGene (see, http://www.ncbi.nlm.nih.gov/UniGene/). 

Once a lung cancer nucleic acid is identified, it can be cloned and, if necessary, its 

30 constituent parts recombined to form the entire lung cancer nucleic acid coding regions or the 
entire mRNA sequence. Once isolated from its natural source, e.g., contained within a 
plasmid or other vector or excised therefrom as a linear nucleic acid segment, the 
recombinant lung cancer nucleic acid can be further used as a probe to identify and isolate 
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other lung cancer nucleic acids, e.g., extended coding regions. It can also be used as a 
"precursor" nucleic acid to make modified or variant lung cancer nucleic acids and proteins. 

The lung cancer nucleic acids of the present invention are used in several ways. In a 
first embodiment, nucleic acid probes to the lung cancer nucleic acids are made and attached 
5 to biochips to be used in screening and diagnostic methods, as outlined below, or for 
administration, e.g., for gene therapy, RNAi, vaccine, and/or antisense applications. 
Alternatively, the lung cancer nucleic acids that include coding regions of lung cancer 
proteins can be put into expression vectors for the expression of lung cancer proteins, again 
for screening purposes or for administration to a patient. 

10 In a preferred embodiment, nucleic acid probes to lung cancer nucleic acids (both the 

nucleic acid sequences outlined in the figures and/or the complements thereof) are made. 
The nucleic acid probes attached to the biochip are designed to be substantially 
complementary to the lung cancer nucleic acids, i.e., the target sequence (either the target 
sequence of the sample or to other probe sequences, e.g., in sandwich assays), such that 

1 5 hybridization of the target sequence and the probes of the present invention occurs. As 

outlined below, this complementarity need not be perfect; there may be any number of base 
pair mismatches which will interfere with hybridization between the target sequence and the 
single stranded nucleic acids of the present invention. However, if the number of mutations 
is so great that no hybridization can occur under even the least stringent of hybridization 

20 conditions, the sequence is not a complementary target sequence. Thus, by "substantially 
complementary" herein is meant that the probes are sufficiently complementary to the target 
sequences to hybridize under appropriate reaction conditions, particularly high stringency 
conditions, as outlined herein. 

A nucleic acid probe is generally single stranded but can be partially single and 

25 partially double stranded. The strandedness of the probe is dictated by the structure, 

composition, and properties of the target sequence. In general, the nucleic acid probes range 
from about 8 to about 100 bases long, with from about 10 to about 80 bases being preferred, 
and from about 30 to about 50 bases being particularly preferred. That is, generally 
complements of ORFs or whole genes are not used. In some embodiments, nucleic acids of 

30 lengths up to hundreds of bases can be used. 

In a preferred embodiment, more than one probe per sequence is used, with either 
overlapping probes or probes to different sections of the target being used. That is, two, 
three, four or more probes, with three being preferred, are used to build in a redundancy for a 
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particular target. The probes can be overlapping (i.e., have some sequence in common), or 
separate. In some cases, PCR primers may be used to amplify signal for higher sensitivity. 

As will be appreciated by those in the art, nucleic acids can be attached or 
immobilized to a solid support in a wide variety of ways. By "immobilized" and grammatical 
5 equivalents herein is meant the association or binding between the nucleic acid probe and the 
solid support is sufficient to be stable under the conditions of binding, washing, analysis, and 
removal as outlined below. The binding can typically be covalent or non-covalent. By "non- 
covalent binding" and grammatical equivalents herein is typically meant one or more of 
electrostatic, hydrophilic, and hydrophobic interactions. Included in non-covalent binding is 
10 the covalent attachment of a molecule, such as streptavidin, to the support and the non- 
covalent binding of the biotinylated probe to the streptavidin. By "covalent binding" and 
grammatical equivalents herein is meant that the two moieties, the solid support and the 
probe, are attached by at least one bond, including sigma bonds, pi bonds and coordination 
bonds. Covalent bonds can be formed directly between the probe and the solid support or can 

15 be formed by a cross linker or by inclusion of a specific reactive group on either the solid 
support or the probe or both molecules. Immobilization may also involve a combination of 
covalent and non-covalent interactions. 

In general, the probes are attached to a biochip in a wide variety of ways, as will be 
appreciated by those in the art. As described herein, the nucleic acids can either be 

20 synthesized first, with subsequent attachment to the biochip, or can be directly synthesized on 
the biochip. 

The biochip comprises a suitable solid substrate. By "substrate" or "solid support" or 
other grammatical equivalents herein is meant a material that can be modified for the 
attachment or association of the nucleic acid probes and is amenable to at least one detection 

25 method. Often the substrate may contain discrete individual sites appropriate for individual 
partitioning and identification. As will be appreciated by those in the art, the number of 
possible substrates is very large, and includes, but is not limited to, glass and modified or 
functionalized glass, plastics (including acrylics, polystyrene and copolymers of styrene and 
other materials, polypropylene, polyethylene, polybutylene, polyurethanes, Teflon, etc.), 

30 polysaccharides, nylon or nitrocellulose, resins, silica or silica-based materials including 
silicon and modified silicon, carbon, metals, inorganic glasses, plastics, etc. In general, the 
substrates allow optical detection and do not appreciably fluoresce. A preferred substrate is 
described in US application entitled Reusable Low Fluorescent Plastic Biochip, U.S. 
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Application Serial No. 09/270,214, filed March 15, 1999, herein incorporated by reference in 
its entirety. 

Generally the substrate is planar, although as will be appreciated by those in the art, 
other configurations of substrates may be used as well. For example, the probes may be 
5 placed on the inside surface of a tube, for flow-through sample analysis to minimize sample 
volume. Similarly, the substrate may be flexible, such as a flexible foam, including closed 
cell foams made of particular plastics. 

In a preferred embodiment, the surface of the biochip and the probe may be 
derivatized with chemical functional groups for subsequent attachment of the two. Thus, e.g., 

10 the biochip is derivatized with a chemical functional group including, but not limited to, 
amino groups, carboxy groups, oxo groups and thiol groups, with amino groups being 
particularly preferred. Using these functional groups, the probes can be attached using 
functional groups on the probes. For example, nucleic acids containing amino groups can be 
attached to surfaces comprising amino groups, e.g., using linkers as are known in the art; e.g., 

15 homo- or hetero-bifunctional linkers as are well known (see 1994 Pierce Chemical Company 
catalog, technical section on cross-linkers, pages 155-200). In addition, in some cases, 
additional linkers, such as alkyl groups (including substituted and heteroalkyl groups) may be 
used. 

In this embodiment, oligonucleotides are synthesized, and then attached to the surface 
20 of the solid support. Either the 5' or 3' terminus may be attached to the solid support, or 

attachment may be via linkage to an internal nucleoside. 

In another embodiment, the immobilization to the solid support may be very strong, 

yet non-covalent. For example, biotinylated oligonucleotides can be made, which bind to 

surfaces covalently coated with streptavidin, resulting in attachment. 
25 Alternatively, the oligonucleotides may be synthesized on the surface, as is known in 

the art. For example, photoactivation techniques utilizing photopolymerization compounds 

and techniques are used. In a preferred embodiment, the nucleic acids can be synthesized in 

situ, using known photolithographic techniques, such as those described in WO 95/25116; 

WO 95/35505; U.S. Patent Nos. 5,700,637 and 5,445,934; and references cited within, all of 
30 which are expressly incorporated by reference; these methods of attachment form the basis of 

the Affymetrix GeneChip™ technology. 

Often, amplification-based assays are performed to measure the expression level of 

lung cancer-associated sequences. These assays are typically performed in conjunction with 
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reverse transcription. In such assays, a lung cancer-associated nucleic acid sequence acts as a 
template in an amplification reaction (e.g., Polymerase Chain Reaction, or PCR). In a 
quantitative amplification, the amount of amplification product will be proportional to the 
amount of template in the original sample. Comparison to appropriate controls provides a 
5 measure of the amount of lung cancer-associated RNA. Methods of quantitative 

amplification are well known to those of skill in the art. Detailed protocols for quantitative 
PCR are provided, e.g., in Innis, et al. (1990) PCR Protocols. A Guide to Methods and 
Applications. 

In some embodiments, a TaqMan based assay is used to measure expression. 

10 TaqMan based assays use a fluorogenic oligonucleotide probe that contains a 5' fluorescent 
dye and a 3' quenching agent. The probe hybridizes to a PCR product, but cannot itself be 
extended due to a blocking agent at the 3' end. When the PCR product is amplified in 
subsequent cycles, the 5' nuclease activity of the polymerase, e.g., AmpliTaq, results in the 
cleavage of the TaqMan probe. This cleavage separates the 5' fluorescent dye and the 3' 

1 5 quenching agent, thereby resulting in an increase in fluorescence as a function of 

amplification (see, e.g., literature provided by Perkin-Elmer, e.g., www2.perkin-elmer.com). 

Other suitable amplification methods include, but are not limited to, ligase chain 
reaction (LCR) (see Wu and Wallace (1989) Genomics 4:560, Landegren, et al. (1988) 
Science 241:1077, and Barringer, et al. (1990) Gene 89:117), transcription amplification 

20 (Kwoh, et al. (1989) Proc. Natl. Acad. Sci. USA 86:1173), self-sustained sequence 

replication (Guatelli, et al. (1990) Proc. Nat. Acad. Sci. USA 87:1874), dot PCR, and linker 
adapter PCR, etc. 

Expression of lung cancer proteins from nucleic acids 

25 In a preferred embodiment, lung cancer nucleic acids, e.g., encoding lung cancer 

proteins, are used to make a variety of expression vectors to express lung cancer proteins 
which can then be used in screening assays, as described below. Expression vectors and 
recombinant DNA technology are well known to those of skill in the art (see, e.g., Ausubel, 
supra, and Fernandez and Hoeffler (eds 1999) Gene Expression Systems) and are used to 

30 express proteins. The expression vectors may be either self-replicating extrachromosomal 
vectors or vectors which integrate into a host genome. Generally, these expression vectors 
include transcriptional and translational regulatory nucleic acid operably linked to the nucleic 
acid encoding the lung cancer protein. The term "control sequences" refers to DNA 

38 



WO 02/086443 PCT/US02/12476 

sequences used for the expression of an operably linked coding sequence in a particular host 
organism. Control sequences that are suitable for prokaryotes, e.g., include a promoter, 
optionally an operator sequence, and a ribosome binding site. Eukaryotic cells are known to 
utilize promoters, polyadenylation signals, and enhancers. 
5 Nucleic acid is "operably linked" when it is placed into a functional relationship with 

another nucleic acid sequence. For example, DNA for a presequence or secretory leader is 
operably linked to DNA for a polypeptide if it is expressed as a preprotein that participates in 
the secretion of the polypeptide; a promoter or enhancer is operably linked to a coding 
sequence if it affects the transcription of the sequence; or a ribosome binding site is operably 

10 linked to a coding sequence if it is positioned so as to facilitate translation. Generally, 

"operably linked" means that the DNA sequences being linked are contiguous, and, in the 
case of a secretory leader, contiguous and in reading phase. However, enhancers do not have 
to be contiguous. Linking is typically accomplished by ligation at convenient restriction 
sites. If such sites do not exist, synthetic oligonucleotide adaptors or linkers are used in 

1 5 accordance with conventional practice. Transcriptional and translational regulatory nucleic 
acid will generally be appropriate to the host cell used to express the lung cancer protein. 
Numerous types of appropriate expression vectors, and suitable regulatory sequences are 
known in the art for a variety of host cells. 

In general, transcriptional and translational regulatory sequences may include, but are 

20 not limited to, promoter sequences, ribosomal binding sites, transcriptional start and stop 

sequences, translational start and stop sequences, and enhancer or activator sequences. In a 
preferred embodiment, the regulatory sequences include a promoter and transcriptional start 
and stop sequences. 

Promoter sequences may be either constitutive or inducible promoters. The promoters 
25 may be either naturally occurring promoters or hybrid promoters. Hybrid promoters, which 
combine elements of more than one promoter, are also known in the art, and are useful in the 
present invention. 

In addition, an expression vector may comprise additional elements. For example, the 
expression vector may have two replication systems, thus allowing it to be maintained in two 
30 organisms, e.g., in mammalian or insect cells for expression and in a prokaryotic host for 
cloning and amplification. Furthermore, for integrating expression vectors, the expression 
vector often contains at least one sequence homologous to the host cell genome, and 
preferably two homologous sequences which flank the expression construct. The integrating 
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vector may be directed to a specific locus in the host cell by selecting the appropriate 
homologous sequence for inclusion in the vector. Constructs for integrating vectors are well 
known in the art (e.g., Fernandez and Hoeffler, supra). 

In addition, in a preferred embodiment, the expression vector contains a selectable 
5 marker gene to allow the selection of transformed host cells. Selection genes are well known 
in the art and will vary with the host cell used. 

The lung cancer proteins of the present invention are usually produced by culturing a 
host cell transformed with an expression vector containing nucleic acid encoding a lung 
cancer protein, under the appropriate conditions to induce or cause expression of the lung 

1 0 cancer protein. Conditions appropriate for lung cancer protein expression will vary with the 
choice of the expression vector and the host cell, and will be easily ascertained by one skilled 
in the art through routine experimentation or optimization. For example, the use of 
constitutive promoters in the expression vector will require optimizing the growth and 
proliferation of the host cell, while the use of an inducible promoter requires the appropriate 

15 growth conditions for induction. In addition, in some embodiments, the timing of the harvest 
is important. For example, the baculoviral systems used in insect cell expression are lytic 
viruses, and thus harvest time selection can be crucial for product yield. 

Appropriate host cells include yeast, bacteria, archaebacteria, fungi, and insect and 
animal cells, including mammalian cells. Of particular interest are Saccharomyces cerevisiae 

20 and other yeasts, E. coli, Bacillus subtilis, Sf9 cells, C129 cells, 293 cells, Neurospora, BHK, 
CHO, COS, HeLa cells, HUVEC (human umbilical vein endothelial cells), THP1 cells (a 
macrophage cell line) and various other human cells and cell lines. 

In a preferred embodiment, the lung cancer proteins are expressed in mammalian 
cells. Mammalian expression systems are also known in the art, and include retroviral and 

25 adenoviral systems. Of particular use as mammalian promoters are the promoters from 
mammalian viral genes, since the viral genes are often highly expressed and have a broad 
host range. Examples include the SV40 early promoter, mouse mammary tumor virus LTR 
promoter, adenovirus major late promoter, herpes simplex virus promoter, and the CMV 
promoter (see, e.g., Fernandez and Hoeffler, supra). Typically, transcription termination and 

30 polyadenylation sequences recognized by mammalian cells are regulatory regions located 3' 
to the translation stop codon and thus, together with the promoter elements, flank the coding 
sequence. Examples of transcription terminator and polyadenylation signals include those 
derived from SV40. 
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The methods of introducing exogenous nucleic acid into mammalian hosts, as well as 
other hosts, are well known in the art, and will vary with the host cell used. Techniques 
include dextran-mediated transfection, calcium phosphate precipitation, polybrene mediated 
transfection, protoplast fusion, electroporation, viral infection, encapsulation of the 
polynucleotide(s) in liposomes, and direct microinjection of the DNA into nuclei. 

In a preferred embodiment, lung cancer proteins are expressed in bacterial systems. 
Promoters from bacteriophage may also be used and are known in the art. In addition, 
synthetic promoters and hybrid promoters are also useful; e.g., the tac promoter is a hybrid of 
the trp and lac promoter sequences. Furthermore, a bacterial promoter can include naturally 
occurring promoters of non-bacterial origin that have the ability to bind bacterial RNA 
polymerase and initiate transcription. In addition to a functioning promoter sequence, an 
efficient ribosome binding site is desirable. The expression vector may also include a signal 
peptide sequence that provides for secretion of the lung cancer protein in bacteria. The 
protein is either secreted into the growth media (gram-positive bacteria) or into the 
periplasmic space, located between the inner and outer membrane of the cell (gram-negative 
bacteria). The bacterial expression vector may also include a selectable marker gene to allow 
for the selection of bacterial strains that have been transformed. Suitable selection genes 
include genes which render the bacteria resistant to drugs such as ampicillin, 
chloramphenicol, erythromycin, kanamycin, neomycin and tetracycline. Selectable markers 
also include biosynthetic genes, such as those in the histidine, tryptophan and leucine 
biosynthetic pathways. These components are assembled into expression vectors. Expression 
vectors for bacteria are well known in the art, and include vectors for Bacillus subtilis, E. 
coli, Streptococcus cremoris, and Streptococcus lividans, among others (e.g., Fernandez and 
Hoeffler, supra). The bacterial expression vectors are transformed into bacterial host cells 
using techniques well known in the art, such as calcium chloride treatment, electroporation, 
and others. 

In one embodiment, lung cancer proteins are produced in insect cells. Expression 
vectors for the transformation of insect cells, and in particular, baculovirus-based expression 
vectors, are well known in the art. 

In a preferred embodiment, lung cancer protein is produced in yeast cells. Yeast 
expression systems are well known in the art, and include expression vectors for 
Saccharomyces cerevisiae, Candida albicans and C. maltosa, Hansenula polymorpha, 
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Kluyveromyces fragilis and K. lactis, Pichia guillerimondii, and P. pastor is, 
Schizosaccharomyces pombe, and Yarrowia lipolytica. 

The lung cancer protein may also be made as a fusion protein, using techniques well 
known in the art. Thus, e.g., for the creation of monoclonal antibodies, if the desired epitope 
5 is small, the lung cancer protein may be fused to a carrier protein to form an immunogen. 
Alternatively, the lung cancer protein may be made as a fusion protein to increase expression 
for affinity purification purposes, or for other reasons. For example, when the lung cancer 
protein is a lung cancer peptide, the nucleic acid encoding the peptide may be linked to other 
nucleic acid for expression purposes. 

10 In a preferred embodiment, the lung cancer protein is purified or isolated after 

expression. Lung cancer proteins may be isolated or purified in a variety of appropriate 
ways. Standard purification methods include electrophoretic, molecular, immunological and 
chromatographic techniques, including ion exchange, hydrophobic, affinity, and reverse- 
phase HPLC chromatography, and chromatofocusing. For example, the lung cancer protein 

1 5 may be purified using a standard anti-lung cancer protein antibody column. Ultrafiltration 
and diafiltration techniques, in conjunction with protein concentration, are also useful. For 
general guidance in suitable purification techniques, see Scopes (1982) Protein Purification . 
The degree of purification necessary will vary depending on the use of the lung cancer 
protein. In some instances no purification will be necessary. 

20 Once expressed and purified if necessary, the lung cancer proteins and nucleic acids 

are useful in a number of applications. They may be used as immunoselection reagents, as 
vaccine reagents, as screening agents, therapeutic entities, for production of antibodies, as 
transcription or translation inhibitors, etc. 

25 Variants of lung cancer proteins 

In one embodiment, the lung cancer proteins are derivative or variant lung cancer 
proteins as compared to the wild-type sequence. That is, as outlined more fully below, the 
derivative lung cancer peptide will often contain at least one amino acid substitution, deletion 
or insertion, with amino acid substitutions being particularly preferred. The amino acid 
30 substitution, insertion or deletion may occur at a particular residue within the lung cancer 
peptide. 

Also included within one embodiment of lung cancer proteins of the present invention 
are amino acid sequence variants. These variants typically fall into one or more of three 
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classes: substitutional, insertional or deletional variants. These variants ordinarily are 
prepared by site specific mutagenesis of nucleotides in the DNA encoding the lung cancer 
protein, using cassette or PCR mutagenesis or other techniques, to produce DNA encoding 
the variant, and thereafter expressing the DNA in recombinant cell culture as outlined above. 
5 However, variant lung cancer protein fragments having up to about 100-150 residues may be 
prepared by in vitro synthesis. Amino acid sequence variants are characterized by the 
predetermined nature of the variation, a feature that sets them apart from naturally occurring 
allelic or interspecies variation of the lung cancer protein amino acid sequence. The variants 
typically exhibit a similar qualitative biological activity as the naturally occurring analogue, 
10 although variants can also be selected which have modified characteristics as will be more 
fully outlined below. 

* 

While the site or region for introducing an amino acid sequence variation is often 
predetermined, the mutation per se need not be predetermined. For example, in order to 
optimize the performance of a mutation at a given site, random mutagenesis may be 
1 5 conducted at the target codon or region and the expressed lung cancer variants screened for 
the optimal combination of desired activity. Techniques exist for making substitution 
mutations at predetermined sites in DNA having a known sequence, e.g., M13 primer 
mutagenesis and PCR mutagenesis. Screening of mutants is often done using assays of lung 
cancer protein activities. 

20 Amino acid substitutions are typically of single residues; insertions usually will be on 

the order of from about 1 to 20 amino acids, although considerably larger insertions may be 
occasionally tolerated. Deletions generally range from about 1 to about 20 residues, although 
in some cases deletions may be much larger. 

Substitutions, deletions, insertions or any combination thereof may be used to arrive 

25 at a final derivative. Generally these changes are done on a few amino acids to minimize the 
alteration of the molecule. Larger changes may be tolerated in certain circumstances. When 
small alterations in the characteristics of a lung cancer protein are desired, substitutions are 
generally made in accordance with the amino acid substitution chart provided in the 
definition section. 

30 Variants typically exhibit essentially the same qualitative biological activity and will 

elicit the same immune response as a naturally-occurring analog, although variants also are 
selected to modify the characteristics of lung cancer proteins as needed. Alternatively, the 
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variant may be designed or reorganized such that a biological activity of the lung cancer 
protein is altered. For example, glycosylation sites may be added, altered, or removed. 

Covalent modifications of lung cancer polypeptides are included within the scope of 
this invention. One type of covalent modification includes reacting targeted amino acid 
5 residues of a lung cancer polypeptide with an organic derivatizing agent that is capable of 
reacting with selected side chains or the N-or C-terminal residues of a lung cancer 
polypeptide. Derivatization with bifunctional agents is useful, for instance, for crosslinking 
lung cancer polypeptides to a water-insoluble support matrix or surface for use in a method 
for purifying anti-lung cancer polypeptide antibodies or screening assays, as is more fully 

10 described below. Commonly used crosslinking agents include, e.g., 1,1-bis(diazoacetyl)-2- 
phenylethane, glutaraldehyde, N-hydroxysuccinimide esters, e.g., esters with 4-azidosalicylic 
acid, homobifunctional imidoesters, including disuccinimidyl esters such as 3,3'- 
dithiobis(succinimidylpropionate), bifunctional maleimides such as bis-N-maleimido-1,8- 
octane and agents such as methyl-3-((p-azidophenyl)dithio)propioimidate. 

15 Other modifications include deamidation of glutaminyl and asparaginyl residues to 

the corresponding glutamyl and aspartyl residues, respectively, hydroxylation of proline and 
lysine, phosphorylation of hydroxyl groups of serinyl, threonyl or tyrosyl residues, 
methylation of the y-amino groups of lysine, arginine, and histidine side chains (Creighton 
(1983) Proteins: Structure and Molecular Properties , pp. 79-86), acetylation of the N-terminal 

20 amine, and amidation of any C-terminal carboxyl group. 

Another type of covalent modification of the lung cancer polypeptide encompassed by 
this invention is an altered native glycosylation pattern of the polypeptide. "Altering the 
native glycosylation pattern" is intended herein to mean adding to or deleting one or more 
carbohydrate moieties of a native sequence lung cancer polypeptide. Glycosylation patterns 

25 can be altered in many ways. For example the use of different cell types to express lung 
cancer-associated sequences can result in different glycosylation patterns. 

Addition of glycosylation sites to lung cancer polypeptides may also be accomplished 
by altering the amino acid sequence thereof. The alteration may be made, e.g., by the 
addition of, or substitution by, one or more serine or threonine residues to the native sequence 

30 lung cancer polypeptide (for O-linked glycosylation sites). The lung cancer amino acid 
sequence may optionally be altered through changes at the DNA level, particularly by 
mutating the DNA encoding the lung cancer polypeptide at preselected bases such that 
codons are generated that will translate into the desired amino acids. 
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Another means of increasing the number of carbohydrate moieties on the lung cancer 
polypeptide is by chemical or enzymatic coupling of glycosides to the polypeptide. Such 

« 

methods are described in the art, e.g., in WO 87/05330, and in Aplin and Wriston (1981) 
CRC Crit. Rev. Biochem. , pp. 259-306. 
5 Removal of carbohydrate moieties present on the lung cancer polypeptide may be 

accomplished chemically or enzymatically or by mutational substitution of codons encoding 
for amino acid residues that serve as targets for glycosylation. Chemical deglycosylation 
techniques are known in the art and described, for instance, by Hakimuddin, et al. (1987) 
Arch. Biochem. Biophys. 259:52 and by Edge, et al. (1981) Anal. Biochem. 118:131. 
10 Enzymatic cleavage of carbohydrate moieties on polypeptides can be achieved by the use of a 
variety of endo-and exo-glycosidases as described by Thotakura, et al. (1987) Meth. 
Enzymol. 138:350. 

Another type of covalent modification of lung cancer polypeptides comprises linking the lung 
cancer polypeptide to one of a variety of nonproteinaceous polymers, e.g., polyethylene 

15 glycol, polypropylene glycol, or polyoxyalkylenes, in the manner set forth in U.S. Patent 
Nos. 4,640,835; 4,496,689; 4,301,144; 4,670,417; 4,791,192, or 4,179,337. 

Lung cancer polypeptides of the present invention may also be modified in a way to 
form chimeric molecules comprising a lung cancer polypeptide fused to another, 
heterologous polypeptide or amino acid sequence. In one embodiment, such a chimeric 

20 molecule comprises a fusion of a lung cancer polypeptide with a tag polypeptide which 
provides an epitope to which an anti-tag antibody can selectively bind. The epitope tag is 
generally placed at the amino-or carboxyl-terminus of the lung cancer polypeptide. The 
presence of such epitope-tagged forms of a lung cancer polypeptide can be detected using an 
antibody against the tag polypeptide. Also, provision of the epitope tag enables the lung 

25 cancer polypeptide to be readily purified by affinity purification using an anti-tag antibody or 
another type of affinity matrix that binds to the epitope tag. In an alternative embodiment, 
the chimeric molecule may comprise a fusion of a lung cancer polypeptide with an 
immunoglobulin or a particular region of an immunoglobulin. For a bivalent form of the 
chimeric molecule, such a fusion could be to the Fc region of an IgG molecule. 

30 Various tag polypeptides and their respective antibodies are well known and examples 

include poly-histidine (poly-his) or poly-histidine-glycine (poly-his-gly) tags; HIS 6 and metal 
chelation tags, the flu HA tag polypeptide and its antibody 12CA5 (Field, et al. (1988) Mol. 
Cell. Biol. 8:2159-2165); the c-myc tag and the 8F9, 3C7, 6E10, G4, B7 and 9E10 antibodies 
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thereto (Evan, et al. (1985) Molecular and Cellular Biology 5:3610-3616); and the Herpes 
Simplex virus glycoprotein D (gD) tag and its antibody (Paborsky, et al. (1990) Protein 
Engineering 3(6):547-553). Other tag polypeptides include the Flag-peptide (Hopp, et al. 
(1988) BioTechnology 6:1204-1210); the KT3 epitope peptide (Martin, et al. (1992) Science 
5 255:192-194); tubulin epitope peptide (Skinner, et al. (1991) J. Biol. Chem. 266:15163- 
15166); and the T7 gene 10 protein peptide tag (Lutz-Freyermuth, et al. (1990) Proc. Nat'l 
Acad. Sci. USA 87:6393-6397). 

Also included are other lung cancer proteins of the lung cancer family, and lung 
cancer proteins from other organisms, which are cloned and expressed as outlined below. 

10 Thus, probe or degenerate polymerase chain reaction (PCR) primer sequences may be used to 
find other related lung cancer proteins from primates or other organisms. As will be 
appreciated by those in the art, particularly useful probe and/or PCR primer sequences 
include unique areas of the lung cancer nucleic acid sequence. As is generally known in the 
art, preferred PCR primers are from about 15 to about 35 nucleotides in length, with from 

15 about 20 to about 30 being preferred, and may contain inosine as needed. PCR reaction 
conditions are well known in the art (e.g., Innis, PCR Protocols, supra). 

Antibodies to lung cancer proteins 

In a preferred embodiment, when a lung cancer protein is to be used to generate 
20 antibodies, e.g., for immunotherapy or immunodiagnosis, the lung cancer protein should 
share at least one epitope or determinant with the full length protein. By "epitope" or 
"determinant" herein is typically meant a portion of a protein which will generate and/or bind 
an antibody or T-cell receptor in the context of MHC. Thus, in most instances, antibodies 
made to a smaller lung cancer protein will be able to bind to the full-length protein, 
25 particularly linear epitopes. In a preferred embodiment, the epitope is unique; that is, 
antibodies generated to a unique epitope show little or no cross-reactivity. 

Methods of preparing polyclonal antibodies are well known (e.g., Coligan, supra; and 
Harlow and Lane, supra). Polyclonal antibodies can be raised in a mammal, e.g., by one or 
more injections of an immunizing agent and, if desired, an adjuvant. Typically, the 
30 immunizing agent and/or adjuvant will be injected in the mammal by multiple subcutaneous 
or intraperitoneal injections. The immunizing agent may include a protein encoded by a 
nucleic acid of Tables 1A-16 or fragment thereof or a fusion protein thereof. It may be useful 
to conjugate the immunizing agent to a protein known to be immunogenic in the mammal 
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being immunized. Immunogenic proteins include, e.g., keyhole limpet hemocyanin, serum 
albumin, bovine thyroglobulin, and soybean trypsin inhibitor. Adjuvants include, e.g., 
Freund's complete adjuvant and MPL-TDM adjuvant (monophosphoryl Lipid A, synthetic 
trehalose dicorynomycolate). The immunization protocol may be selected by one skilled in 
5 the art. 

The antibodies may, alternatively, be monoclonal antibodies. Monoclonal antibodies 
may be prepared using hybridoma methods, such as those described by Kohler and Milstein 
(1975) Nature 256:495. In a hybridoma method, a mouse, hamster, or other appropriate host 
animal, is typically immunized with an immunizing agent to elicit lymphocytes that produce 
10 or are capable of producing antibodies that will specifically bind to the immunizing agent. 
Alternatively, the lymphocytes may be immunized in vitro. The immunizing agent will 
typically include a polypeptide encoded by a nucleic acid of the tables, or fragment thereof, 
or a fusion protein thereof. Generally, either peripheral blood lymphocytes ("PBLs") are 
used if cells of human origin are desired, or spleen cells or lymph node cells are used if non- 
15 human mammalian sources are desired. The lymphocytes are then fused with an 

immortalized cell line using a suitable fusing agent, such as polyethylene glycol, to form a 
hybridoma cell (Goding (1986) Monoclonal Antibodies: Principles and Practice, pp. 59-103). 
Immortalized cell lines are usually transformed mammalian cells, particularly myeloma cells 
of rodent, bovine, or primate origin. Usually, rat or mouse myeloma cell lines are employed. 
20 The hybridoma cells may be cultured in a suitable culture medium that preferably contains 
one or more substances that inhibit the growth or survival of the unfused, immortalized cells. 
For example, if the parental cells lack the enzyme hypoxanthine guanine phosphoribosyl 
transferase (HGPRT or HPRT), the culture medium for the hybridomas typically will include 
hypoxanthine, aminopterin, and thymidine ("HAT medium"), which substances prevent the 
25 growth of HGPRT-deficient cells. 

In one embodiment, the antibodies are bispecific antibodies. Bispecific antibodies are 
typically monoclonal, preferably human or humanized, antibodies that have binding 
specificities for at least two different antigens or that have binding specificities for two 
epitopes on the same antigen. In one embodiment, one of the binding specificities is for a 
30 protein encoded by a nucleic acid of the tables or a fragment thereof, the other one is for any 
other antigen, and preferably for a cell-surface protein or receptor or receptor subunit, 
preferably one that is tumor specific. Alternatively, tetramer-type technology may create 
multivalent reagents. 
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In a preferred embodiment, the antibodies to lung cancer protein are capable of 
reducing or eliminating a biological function of a lung cancer protein, in a naked form or 
conjugated to an effector moiety. That is, the addition of anti-lung cancer protein antibodies 
(either polyclonal or preferably monoclonal) to lung cancer tissue (or cells containing lung 
5 cancer) may reduce or eliminate the lung cancer. Generally, at least a 25% decrease in 
activity, growth, size or the like is preferred, with at least about 50% being particularly 
preferred and about a 95-100% decrease being especially preferred. 

In a preferred embodiment the antibodies to the lung cancer proteins are humanized 
antibodies (e.g., Xenerex Biosciences, Medarex, Inc., Abgenix, Inc., Protein Design Labs, 

10 Inc.) Humanized forms of non-human (e.g., murine) antibodies are chimeric molecules of 
immunoglobulins, immunoglobulin chains or fragments thereof (such as Fv, Fab, Fab', 
F(ab')2 or other antigen-binding subsequences of antibodies) which contain minimal 
sequence derived from non-human immunoglobulin. Humanized antibodies include human 
immunoglobulins (recipient antibody) in which residues from a complementary determining 

1 5 region (CDR) of the recipient are replaced by residues from a CDR of a non-human species 
(donor antibody) such as mouse, rat or rabbit having the desired specificity, affinity and 
capacity. In some instances, Fv framework residues of a human immunoglobulin are 
replaced by corresponding non-human residues. Humanized antibodies may also comprise 
residues which are found neither in the recipient antibody nor in the imported CDR or 

20 framework sequences. In general, a humanized antibody will comprise substantially all of at 
least one, and typically two, variable domains, in which all or substantially all of the CDR 
regions correspond to those of a non-human immunoglobulin and all or substantially all of 
the framework (FR) regions are those of a human immunoglobulin consensus sequence. A 
humanized antibody optimally also will typically comprise at least a portion of an 

25 immunoglobulin constant region (Fc), typically that of a human immunoglobulin (Jones, et 
al. (1986) Nature 321:522-525; Riechmann, et al. (1988) Nature 332:323-329; and Presta 
(1992) Curr. Op. Struct. Biol. 2:593-596). Humanization can be performed following the 
method of Winter and co-workers (Jones, et al. (1986) Nature 321:522-525; Riechmann, et al. 
(1988) Nature 332:323-327; Verhoeyen, et al. (1988) Science 239:1534-1536), by 

30 substituting rodent CDRs or CDR sequences for corresponding sequences of a human 

antibody. Accordingly, such humanized antibodies are chimeric antibodies (U.S. Patent No. 
4,816,567), wherein substantially less than an intact human variable domain has been 
substituted by corresponding sequence from a non-human species. 
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Human-like antibodies can also be produced using various techniques known in the 
art, including phage display libraries (Hoogenboom and Winter (1991) J. Mol. Biol. 227:381; 
Marks, et al. (1991) J. Mol. Biol. 222:581). The techniques of Cole, et al. and Boerner, et al. 
are also available for the preparation of human monoclonal antibodies (Cole, et al. (1985) 
5 Monoclonal Antibodies and Cancer Therapy , p. 77 and Boerner, et al. (1991) J. Immunol. 
147(1):86-95). Similarly, human antibodies can be made by introducing human 
immunoglobulin loci into transgenic animals, e.g., mice in which the endogenous 
immunoglobulin genes have been partially or completely inactivated. Upon challenge, 
human antibody production is observed, which closely resembles that seen in humans in 

10 nearly all respects, including gene rearrangement, assembly, and antibody repertoire. This 
approach is described, e.g., in U.S. Patent Nos. 5,545,807; 5,545,806; 5,569,825; 5,625,126; 
5,633,425; 5,661,016, and in the following scientific publications: Marks, et al. (1992) 
Bio/Technology 10:779-783; Lonberg, et al. (1994) Nature 368:856-859; Morrison (1994) 
Nature 368:812-13; Fishwild, et al. (1996) Nature Biotechnology 14:845-51; Neuberger 

15 (1996) Nature Biotechnology 14:826; and Lonberg and Huszar (1995) Intern. Rev. Immunol. 
13:65-93. 

By immunotherapy is meant treatment of lung cancer with an antibody raised against 
a lung cancer protein. As used herein, immunotherapy can be passive or active. Passive
immunotherapy as defined herein is the passive transfer of antibody to a recipient (patient). 

20 Active immunization is the induction of antibody and/or T-cell responses in a recipient 

(patient). Induction of an immune response is the result of providing the recipient with an 
antigen to which antibodies are raised. The antigen may be provided by injecting a 
polypeptide against which antibodies are desired to be raised into a recipient, or contacting 
the recipient with a nucleic acid capable of expressing the antigen and under conditions for 

25 expression of the antigen, leading to an immune response. 

In a preferred embodiment the lung cancer proteins against which antibodies are 
raised are secreted proteins as described above. Without being bound by theory, antibodies 
used for treatment may bind and prevent the secreted protein from binding to its receptor,
thereby inactivating the secreted lung cancer protein. 

30 In another preferred embodiment, the lung cancer protein to which antibodies are 

raised is a transmembrane protein. Without being bound by theory, antibodies used for 
treatment may bind the extracellular domain of the lung cancer protein and prevent it from 
binding to other proteins, such as circulating ligands or cell-associated molecules. The 
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antibody may cause down-regulation of the transmembrane lung cancer protein. The 
antibody may be a competitive, non-competitive or uncompetitive inhibitor of protein binding 

•4 

to the extracellular domain of the lung cancer protein. The antibody may be an antagonist of 
the lung cancer protein or may prevent activation of a transmembrane lung cancer protein, or 
may induce or suppress a particular cellular pathway. In some embodiments, when the 
antibody prevents the binding of other molecules to the lung cancer protein, the antibody 
prevents growth of the cell. The antibody may also be used to target or sensitize the cell to 
cytotoxic agents, including, but not limited to TNF-α, TNF-β, IL-1, INF-γ, and IL-2, or
chemotherapeutic agents including 5FU, vinblastine, actinomycin D, cisplatin, methotrexate, 
and the like. In some instances the antibody may belong to a sub-type that activates serum 
complement when complexed with the transmembrane protein thereby mediating cytotoxicity 
or antigen-dependent cytotoxicity (ADCC). Thus, lung cancer may be treated by 
administering to a patient antibodies directed against the transmembrane lung cancer protein. 
Antibody-labeling may activate a co-toxin, localize a toxin payload, or otherwise provide 
means to locally ablate cells. 

In another preferred embodiment, the antibody is conjugated to an effector moiety. 
The effector moiety can be various molecules, including labeling moieties such as radioactive 
labels or fluorescent labels, or can be a therapeutic moiety. In one aspect the therapeutic 
moiety is a small molecule that modulates the activity of a lung cancer protein. In another 
aspect the therapeutic moiety may modulate an activity of molecules associated with or in 
close proximity to a lung cancer protein. The therapeutic moiety may inhibit enzymatic or 
signaling activity such as protease or collagenase activity associated with lung cancer. 

In a preferred embodiment, the therapeutic moiety can also be a cytotoxic agent. In 
this method, targeting the cytotoxic agent to lung cancer tissue or cells results in a reduction 
in the number of afflicted cells, thereby reducing symptoms associated with lung cancer. 
Cytotoxic agents are numerous and varied and include, but are not limited to, cytotoxic drugs 
or toxins or active fragments of such toxins. Suitable toxins and their corresponding 
fragments include diphtheria A chain, exotoxin A chain, ricin A chain, abrin A chain, curcin, 
crotin, phenomycin, enomycin, saporin, auristatin, and the like. Cytotoxic agents also include 
radiochemicals made by conjugating radioisotopes to antibodies raised against lung cancer 
proteins, or binding of a radionuclide to a chelating agent that has been covalently attached to 
the antibody. Targeting the therapeutic moiety to transmembrane lung cancer proteins not 
only serves to increase the local concentration of therapeutic moiety in the lung cancer 
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afflicted area, but also serves to reduce deleterious side effects that may be associated with 
the untargeted therapeutic moiety. 

In another preferred embodiment, the lung cancer protein against which the antibodies 
are raised is an intracellular protein. In this case, the antibody may be conjugated to a protein 
5 or other entity which facilitates entry into the cell. In one case, the antibody enters the cell by 
endocytosis. In another embodiment, a nucleic acid encoding the antibody is administered to 
the individual or cell. Moreover, wherein the lung cancer protein can be targeted within a 
cell, i.e., the nucleus, an antibody thereto may contain a signal for that target localization, i.e.,
a nuclear localization signal. 
10 The lung cancer antibodies of the invention specifically bind to lung cancer proteins. 

By "specifically bind" herein is meant that the antibodies bind to the protein with a Kd of at 
least about 0.1 mM, more usually at least about 1 μM, preferably at least about 0.1 μM or
better, and most preferably, 0.01 μM or better. Selectivity of binding to the specific target
and not to related other sequences is also important. 

15 

Detection of lung cancer sequence for diagnostic and therapeutic applications 

In one aspect, the RNA expression levels of genes are determined for different 
cellular states in the lung cancer phenotype. Expression levels of genes in normal tissue (e.g., 
not undergoing lung cancer), in lung cancer tissue (and in some cases, for varying severities 

20 of lung cancer that relate to prognosis, as outlined below), or in non-malignant disease are 
evaluated to provide expression profiles. A gene expression profile of a particular cell state 
or point of development is essentially a "fingerprint" of the state of the cell. While two states 
may have a particular gene similarly expressed, the evaluation of a number of genes 
simultaneously allows the generation of a gene expression profile that is reflective of the state 

25 of the cell. By comparing expression profiles of cells in different states, information 

regarding which genes are important (including both up- and down-regulation of genes) in 
each of these states is obtained. Then, diagnosis may be performed or confirmed to 
determine whether a tissue sample has the gene expression profile of normal or cancerous 
tissue. This will provide for molecular diagnosis of related conditions. 

30 "Differential expression," or grammatical equivalents as used herein, refers to 

qualitative or quantitative differences in the temporal and/or cellular gene expression 
patterns within and among cells and tissue. Thus, a differentially expressed gene can 
qualitatively have its expression altered, including an activation or inactivation, in, e.g., 
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normal versus lung cancer tissue. Genes may be turned on or turned off in a particular state, 
relative to another state thus permitting comparison of two or more states. A qualitatively 
regulated gene will exhibit an expression pattern within a state or cell type which is 
detectable by standard techniques. Some genes will be expressed in one state or cell type, but 
5 not in both. Alternatively, the difference in expression may be quantitative, e.g., in that 
expression is increased or decreased; i.e., gene expression is either upregulated, resulting in 
an increased amount of transcript, or downregulated, resulting in a decreased amount of 
transcript. The degree to which expression differs need only be large enough to quantify via 
standard characterization techniques as outlined below, such as by use of Affymetrix 

10 GeneChip™ expression arrays, Lockhart (1996) Nature Biotechnology 14:1675-1680, hereby
expressly incorporated by reference. Other techniques include, but are not limited to, 
quantitative reverse transcriptase PCR, northern analysis and RNase protection. As outlined 
above, preferably the change in expression (i.e., upregulation or downregulation) is typically 
at least about 50%, more preferably at least about 100%, more preferably at least about 

15 150%, more preferably at least about 200%, with from 300 to at least 1000% being especially 
preferred. 

Evaluation may be at the gene transcript or the protein level. The amount of gene 
expression may be monitored using nucleic acid probes to the RNA or DNA equivalent of the 
gene transcript, and the quantification of gene expression levels, or, alternatively, the final 

20 gene product itself (protein) can be monitored, e.g., with antibodies to the lung cancer protein 
and standard immunoassays (ELISAs, etc.) or other techniques, including mass spectroscopy 
assays, 2D gel electrophoresis assays, etc. Proteins corresponding to lung cancer genes, e.g., 
those identified as being important in a lung cancer or disease phenotype, can be evaluated in 
a lung cancer diagnostic test. In a preferred embodiment, gene expression monitoring is 

25 performed simultaneously on a number of genes. 

The lung cancer nucleic acid probes may be attached to biochips as outlined herein for 
the detection and quantification of lung cancer sequences in a particular cell. The assays are 
further described below in the example. PCR techniques can be used to provide greater 
sensitivity. Multiple protein expression monitoring can be performed as well. Similarly, 

30 these assays may be performed on an individual basis as well. 

In a preferred embodiment nucleic acids encoding the lung cancer protein are 
detected. Although DNA or RNA encoding the lung cancer protein may be detected, of 
particular interest are methods wherein an mRNA encoding a lung cancer protein is detected. 
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Probes to detect mRNA can be a nucleotide/deoxynucleotide probe that is complementary to 
and hybridizes with the mRNA and includes, but is not limited to, oligonucleotides, cDNA or 
RNA. Probes also should contain a detectable label, as defined herein. In one method the 
mRNA is detected after immobilizing the nucleic acid to be examined on a solid support such 
5 as nylon membranes and hybridizing the probe with the sample. Following washing to 

remove the non-specifically bound probe, the label is detected. In another method detection 
of the mRNA is performed in situ. In this method permeabilized cells or tissue samples are 
contacted with a detectably labeled nucleic acid probe for sufficient time to allow the probe 
to hybridize with the target mRNA. Following washing to remove the non-specifically bound 

10 probe, the label is detected. For example a digoxygenin labeled riboprobe (RNA probe) that 
is complementary to the mRNA encoding a lung cancer protein is detected by binding the 
digoxygenin with an anti-digoxygenin secondary antibody and developed with nitro blue 
tetrazolium and 5-bromo-4-chloro-3-indolyl phosphate.

In a preferred embodiment, various proteins from the three classes of proteins as 

15 described herein (secreted, transmembrane or intracellular proteins) are used in diagnostic 
assays. The lung cancer proteins, antibodies, nucleic acids, modified proteins and cells 
containing lung cancer sequences are used in diagnostic assays. This can be performed on an 
individual gene or corresponding polypeptide level. In a preferred embodiment, the 
expression profiles are used, preferably in conjunction with high throughput screening 

20 techniques to allow monitoring for expression profile genes and/or corresponding 
polypeptides. 

As described and defined herein, lung cancer proteins, including intracellular, 
transmembrane, or secreted proteins, find use as markers of lung cancer, e.g., for prognostic 
or diagnostic purposes. Detection of these proteins in putative lung cancer tissue allows for 

25 detection, prognosis, or diagnosis of lung cancer or similar disease, and perhaps for selection 
of therapeutic strategy. In one embodiment, antibodies are used to detect lung cancer 
proteins. A preferred method separates proteins from a sample by electrophoresis on a gel 
(typically a denaturing and reducing protein gel, but may be another type of gel, including 
isoelectric focusing gels and the like). Following separation of proteins, the lung cancer 

30 protein is detected, e.g., by immunoblotting with antibodies raised against the lung cancer 
protein. Methods of immunoblotting are well known to those of ordinary skill in the art. 

In another preferred method, antibodies to the lung cancer protein find use in in situ 
imaging techniques, e.g., in histology (e.g., Asai (ed. 1993) Methods in Cell Biology: 
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Antibodies in Cell Biology, volume 37). In this method cells are contacted with from one to
many antibodies to the lung cancer protein(s). Following washing to remove non-specific 
antibody binding, the presence of the antibody or antibodies is detected. In one embodiment 
the antibody is detected by incubating with a secondary antibody that contains a detectable 
5 label, e.g., multicolor fluorescence or confocal imaging. In another method the primary 

antibody to the lung cancer protein(s) contains a detectable label, e.g., an enzyme marker that 
can act on a substrate. In another preferred embodiment each one of multiple primary 
antibodies contains a distinct and detectable label. This method finds particular use in 
simultaneous screening for a plurality of lung cancer proteins. Many other histological 

1 0 imaging techniques are also provided by the invention. 

In a preferred embodiment the label is detected in a fluorometer which has the ability 
to detect and distinguish emissions of different wavelengths. In addition, a fluorescence 
activated cell sorter (FACS) can be used in the method. 

In another preferred embodiment, antibodies find use in diagnosing lung cancer from 

15 blood, serum, plasma, stool, and other samples. Such samples, therefore, are useful as 

samples to be probed or tested for the presence of lung cancer proteins. Antibodies can be 
used to detect a lung cancer protein by previously described immunoassay techniques 
including ELISA, immunoblotting (western blotting), immunoprecipitation, BIACORE
technology and the like. Conversely, the presence of antibodies may indicate an immune 

20 response against an endogenous lung cancer protein or vaccine. 

In a preferred embodiment, in situ hybridization of labeled lung cancer nucleic acid 
probes to tissue arrays is done. For example, arrays of tissue samples, including lung cancer 
tissue and/or normal tissue, are made. In situ hybridization (see, e.g., Ausubel, supra) is then 
performed. When comparing the fingerprints between an individual and a standard, the 

25 skilled artisan can make a diagnosis, a prognosis, or a prediction based on the findings. It is 
further understood that the genes which indicate the diagnosis may differ from those which 
indicate the prognosis and molecular profiling of the condition of the cells may lead to 
distinctions between responsive or refractory conditions or may be predictive of outcomes. 
In a preferred embodiment, the lung cancer proteins, antibodies, nucleic acids, 

30 modified proteins and cells containing lung cancer sequences are used in prognosis assays. 
As above, gene expression profiles can be generated that correlate to lung cancer, clinical, 
pathological, or other information, in terms of long term prognosis. Again, this may be done 
on either a protein or gene level, with the use of genes being preferred. Single or multiple 
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genes may be useful in various combinations. As above, lung cancer probes may be attached 
to biochips for the detection and quantification of lung cancer sequences in a tissue or patient. 
The assays proceed as outlined above for diagnosis. PCR methods may provide more
sensitive and accurate quantification. 

5 

Assays for therapeutic compounds 

In a preferred embodiment, the proteins, nucleic acids, and antibodies as described 
herein are used in drug screening assays. The lung cancer proteins, antibodies, nucleic acids, 
modified proteins and cells containing lung cancer sequences are used in drug screening 

10 assays or by evaluating the effect of drug candidates on a "gene expression profile" or 

expression profile of polypeptides. In a preferred embodiment, the expression profiles are 
used, preferably in conjunction with high throughput screening techniques to allow 
monitoring for expression profile genes after treatment with a candidate agent (e.g., 
Zlokarnik, et al. (1998) Science 279:84-8; Heid (1996) Genome Res. 6:986-94).

15 In a preferred embodiment, the lung cancer proteins, antibodies, nucleic acids, 

modified proteins and cells containing the native or modified lung cancer proteins are used in 
screening assays. That is, the present invention provides novel methods for screening for 
compositions which modulate the lung cancer phenotype or an identified physiological 
function of a lung cancer protein. As above, this can be done on an individual gene level or 

20 by evaluating the effect of drug candidates on a "gene expression profile". In a preferred 

embodiment, the expression profiles are used, preferably in conjunction with high throughput 
screening techniques to allow monitoring for expression profile genes after treatment with a 
candidate agent, see Zlokarnik, supra. 

Having identified differentially expressed genes herein, a variety of assays may be 

25 performed. In a preferred embodiment, assays may be run on an individual gene or protein 
level. That is, having identified a particular gene with altered regulation in lung cancer, test 
compounds can be screened for the ability to modulate gene expression or for binding to the 
lung cancer protein. "Modulation" thus includes an increase or a decrease in gene 
expression. The preferred amount of modulation will depend on the original change of the 

30 gene expression in normal versus tissue undergoing lung cancer, with changes of at least 

10%, preferably 50%, more preferably 100-300%, and in some embodiments 300-1000% or 
greater. Thus, if a gene exhibits a 4-fold increase in lung cancer tissue compared to normal 
tissue, a decrease of about four-fold is often desired; similarly, a 10-fold decrease in lung 
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cancer tissue compared to normal tissue often provides a target value of a 10-fold increase in 
expression to be induced by the test compound. 

The amount of gene expression may be monitored using nucleic acid probes and the 
quantification of gene expression levels, or, alternatively, the gene product itself can be 
5 monitored, e.g., through the use of antibodies to the lung cancer protein and standard 
immunoassays. Proteomics and separation techniques may also allow quantification of 
expression. 

In a preferred embodiment, gene or protein expression monitoring of a number of 
entities, i.e., an expression profile, is monitored simultaneously. Such profiles will typically 
1 0 involve a plurality of those entities described herein. 

In this embodiment, the lung cancer nucleic acid probes are attached to biochips as 
outlined herein for the detection and quantification of lung cancer sequences in a particular 
cell. Alternatively, PCR may be used. Thus, a series, e.g., of microtiter plates, may be used
with dispensed primers in desired wells. A PCR reaction can then be performed and analyzed
1 5 for each well. 

Expression monitoring can be performed to identify compounds that modify the 
expression of one or more lung cancer-associated sequences, e.g., a polynucleotide sequence 
set out in the tables. Generally, in a preferred embodiment, a test compound is added to the 
cells prior to analysis. Moreover, screens are also provided to identify agents that modulate 

20 lung cancer, modulate lung cancer proteins, bind to a lung cancer protein, or interfere with 
the binding of a lung cancer protein and an antibody, substrate, or other binding partner. 

The term "test compound" or "drug candidate" or "modulator" or grammatical 
equivalents as used herein describes a molecule, e.g., protein, oligopeptide, small organic 
molecule, polysaccharide, polynucleotide, etc., to be tested for the capacity to directly or

25 indirectly alter the lung cancer phenotype or the expression of a lung cancer sequence, e.g., a 
nucleic acid or protein sequence. In preferred embodiments, modulators alter expression 
profiles of nucleic acids or proteins provided herein. In one embodiment, the modulator 
suppresses a lung cancer phenotype, e.g., to a normal or non-malignant tissue fingerprint. In 
another embodiment, a modulator induces a lung cancer phenotype. Generally, a plurality of 

30 assay mixtures are run in parallel with different agent concentrations to obtain a differential 
response to the various concentrations. Typically, one of these concentrations serves as a
negative control, i.e., at zero concentration or below the level of detection. 
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In one aspect, a modulator will neutralize the effect of a lung cancer protein. By 
"neutralize" is meant that activity of a protein and the consequent effect on the cell is 
inhibited or blocked. 

In certain embodiments, combinatorial libraries of potential modulators will be 
5 screened for an ability to bind to a lung cancer polypeptide or to modulate activity. 

Conventionally, new chemical entities with useful properties are generated by identifying a 
chemical compound (called a "lead compound") with some desirable property or activity, 
e.g., inhibiting activity, creating variants of the lead compound, and evaluating the property 
and activity of those variant compounds. Often, high throughput screening (HTS) methods 

10 are employed for such an analysis. 

In one preferred embodiment, high throughput screening methods involve providing a 
library containing a large number of potential therapeutic compounds (candidate 
compounds). Such "combinatorial chemical libraries" are then screened in one or more 
assays to identify those library members (particular chemical species or subclasses) that 

15 display a desired characteristic activity. The compounds thus identified can serve as 

conventional "lead compounds" or can themselves be used as potential or actual therapeutics. 

A combinatorial chemical library is a collection of diverse chemical compounds 
generated by either chemical synthesis or biological synthesis by combining a number of 
chemical "building blocks" such as reagents. For example, a linear combinatorial chemical 

10 library, such as a polypeptide (e.g., mutein) library, is formed by combining a set of chemical 
building blocks called amino acids in every possible way for a given compound length (i.e., 
the number of amino acids in a polypeptide compound). Millions of chemical compounds 
can be synthesized through such combinatorial mixing of chemical building blocks (Gallop, 
et al. (1994) J. Med. Chem. 37(9):1233-1251). 

15 Preparation and screening of combinatorial chemical libraries is well known to those 

of skill in the art. Such combinatorial chemical libraries include, but are not limited to, 
peptide libraries (see, e.g., U.S. Patent No. 5,010,175, Furka (1991) Pept. Prot. Res. 37:487- 
493, Houghton, et al. (1991) Nature 354:84-88), peptoids (PCT Publication No. WO
91/19735), encoded peptides (PCT Publication WO 93/20242), random bio-oligomers (PCT 

10 Publication WO 92/00091), benzodiazepines (U.S. Pat. No. 5,288,514), diversomers such as
hydantoins, benzodiazepines and dipeptides (Hobbs, et al. (1993) Proc. Nat. Acad. Sci. USA 
90:6909-6913), vinylogous polypeptides (Hagihara, et al. (1992) J. Amer. Chem. Soc. 
114:6568), nonpeptidal peptidomimetics with a Beta-D-Glucose scaffolding (Hirschmann, et 
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al. (1992) J. Amer. Chem. Soc. 114:9217-9218), analogous organic syntheses of small 
compound libraries (Chen, et al. (1994) J. Amer. Chem. Soc. 116:2661), oligocarbamates 
(Cho, et al. (1993) Science 261:1303), and/or peptidyl phosphonates (Campbell, et al. (1994)
J. Org. Chem. 59:658). See, generally, Gordon, et al. (1994) J. Med. Chem. 37:1385, nucleic 
5 acid libraries (see, e.g., Stratagene, Corp.), peptide nucleic acid libraries (see, e.g., U.S. 

Patent 5,539,083), antibody libraries (see, e.g., Vaughn, et al. (1996) Nature Biotechnology 
14(3):309-314, and PCT/US96/10287), carbohydrate libraries (see, e.g., Liang, et al. (1996)
Science 274:1520-1522, and U.S. Patent No. 5,593,853), and small organic molecule libraries 
(see, e.g., benzodiazepines, Baum (1993) C&EN, Jan 18, page 33; isoprenoids, U.S. Patent 

10 No. 5,569,588; thiazolidinones and metathiazanones, U.S. Patent No. 5,549,974; pyrrolidines, 
U.S. Patent Nos. 5,525,735 and 5,519,134; morpholino compounds, U.S. Patent No. 
5,506,337; benzodiazepines, U.S. Patent No. 5,288,514; and the like). 

Devices for the preparation of combinatorial libraries are commercially available (see, 
e.g., 357 MPS, 390 MPS, Advanced Chem Tech, Louisville KY, Symphony, Rainin, 

15 Woburn, MA, 433 A Applied Biosystems, Foster City, CA, 9050 Plus, Millipore, Bedford, 
MA). 

A number of well known robotic systems have also been developed for solution phase 
chemistries. These systems include automated workstations like the automated synthesis 
apparatus developed by Takeda Chemical Industries, LTD. (Osaka, Japan) and many robotic 

20 systems utilizing robotic arms (Zymate II, Zymark Corporation, Hopkinton, Mass.; Orca, 

Hewlett-Packard, Palo Alto, Calif.), which mimic the manual synthetic operations performed
by a chemist. The above devices, with appropriate modification, are suitable for use with the 
present invention. In addition, numerous combinatorial libraries are themselves 
commercially available (see, e.g., ComGenex, Princeton, N.J., Asinex, Moscow, RU, Tripos,

25 Inc., St. Louis, MO, ChemStar, Ltd, Moscow, RU, 3D Pharmaceuticals, Exton, PA, Martek 
Biosciences, Columbia, MD, etc.). 

The assays to identify modulators are amenable to high throughput screening. 
Preferred assays thus detect modulation of lung cancer gene transcription, polypeptide 
expression, and polypeptide activity. 

30 High throughput assays for evaluating the presence, absence, quantification, or other 

properties of particular nucleic acids or protein products are well known to those of skill in 
the art. Binding assays and reporter gene assays are similarly well known. Thus,
e.g., U.S. Patent No. 5,559,410 discloses high throughput screening methods for proteins, 
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U.S. Patent No. 5,585,639 discloses high throughput screening methods for nucleic acid 
binding (i.e., in arrays), while U.S. Patent Nos. 5,576,220 and 5,541,061 disclose high 
throughput methods of screening for ligand/antibody binding. 

In addition, high throughput screening systems are commercially available (see, e.g., 
5 Zymark Corp., Hopkinton, MA; Air Technical Industries, Mentor, OH; Beckman 

Instruments, Inc. Fullerton, CA; Precision Systems, Inc., Natick, MA, etc.). These systems 
typically automate procedures, including sample and reagent pipetting, liquid dispensing, 
timed incubations, and final readings of the microplate in detector(s) appropriate for the 
assay. These configurable systems provide high throughput and rapid start up as well as a 

1 0 high degree of flexibility and customization. The manufacturers of such systems provide 
detailed protocols for various high throughput systems. Thus, e.g., Zymark Corp. provides 
technical bulletins describing screening systems for detecting the modulation of gene 
transcription, ligand binding, and the like. 

In one embodiment, modulators are proteins, often naturally occurring proteins or 

15 fragments of naturally occurring proteins. Thus, e.g., cellular extracts containing proteins, or 
random or directed digests of proteinaceous cellular extracts, may be used. In this way 
libraries of proteins may be made for screening in the methods of the invention. Particularly 
preferred in this embodiment are libraries of bacterial, fungal, viral, and mammalian proteins, 
with the latter being preferred, and human proteins being especially preferred. Particularly 

20 useful test compounds will be directed to the class of proteins to which the target belongs, e.g.,
substrates for enzymes or ligands and receptors. 

In a preferred embodiment, modulators are peptides of from about 5 to about 30 
amino acids, with from about 5 to about 20 amino acids being preferred, and from about 7 to 
about 15 being particularly preferred. The peptides may be digests of naturally occurring 

25 proteins, random peptides, or "biased" random peptides. By "randomized" or grammatical 
equivalents herein is meant that the nucleic acid or peptide consists of essentially random 
sequences of nucleotides and amino acids, respectively. Since these random peptides (or 
nucleic acids, discussed below) are often chemically synthesized, they may incorporate a 

* 

nucleotide or amino acid at any position. The synthetic process can be designed to generate 
30 randomized proteins or nucleic acids, to allow the formation of all or most of the possible 

combinations over the length of the sequence, thus forming a library of randomized candidate 
bioactive proteinaceous agents. 
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In one embodiment, the library is fully randomized, with no sequence preferences or 
constants at any position. In a preferred embodiment, the library is biased. That is, some 
positions within the sequence are either held constant, or are selected from a limited number 
of possibilities. In a preferred embodiment, the nucleotides or amino acid residues are 
5 randomized within a defined class, e.g., of hydrophobic amino acids, hydrophilic residues, 
sterically biased (either small or large) residues, towards the creation of nucleic acid binding 
domains, the creation of cysteines, for cross-linking, prolines for SH-3 domains, serines, 
threonines, tyrosines or histidines for phosphorylation sites, etc. 

Modulators of lung cancer can also be nucleic acids, as defined above. 

10 As described above generally for proteins, nucleic acid modulating agents may be 

naturally occurring nucleic acids, random nucleic acids, or "biased" random nucleic acids. 
Digests of procaryotic or eucaryotic genomes may be used as is outlined above for proteins. 

In a preferred embodiment, the candidate compounds are organic chemical moieties, a 
wide variety of which are available in the literature. 

15 After a candidate agent has been added and the cells allowed to incubate for some 

period of time, the sample containing a target sequence is analyzed. If required, the target 
sequence is prepared using known techniques. For example, the sample may be treated to 
lyse the cells, using known lysis buffers, electroporation, etc., with purification and/or 
amplification such as PCR performed as appropriate. For example, an in vitro transcription

20 with labels covalently attached to the nucleotides is performed. Generally, the nucleic acids 
are labeled with biotin-FITC or PE, or with cy3 or cy5. 

In a preferred embodiment, the target sequence is labeled with, e.g., a fluorescent, a 
chemiluminescent, a chemical, or a radioactive signal, to provide a means of detecting the 
target sequence's specific binding to a probe. The label also can be an enzyme, such as, 

25 alkaline phosphatase or horseradish peroxidase, which when provided with an appropriate 
substrate produces a product that can be detected. Alternatively, the label can be a labeled 
compound or small molecule, such as an enzyme inhibitor, that binds but is not catalyzed or 
altered by the enzyme. The label also can be a moiety or compound, such as, an epitope tag 
or biotin which specifically binds to streptavidin. For the example of biotin, the streptavidin 

30 is labeled as described above, thereby, providing a detectable signal for the bound target 
sequence. Unbound labeled streptavidin is typically removed prior to analysis. 

Nucleic acid assays can be direct hybridization assays or can comprise "sandwich 
assays", which include the use of multiple probes, as is generally outlined in U.S. Patent Nos. 
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5,681,702, 5,597,909, 5,545,730, 5,594,117, 5,591,584, 5,571,670, 5,580,731, 5,571,670, 
5,591,584, 5,624,802, 5,635,352, 5,594,118, 5,359,100, 5,124,246 and 5,681,697, all of 
which are hereby incorporated by reference. In this embodiment, in general, the target nucleic 
acid is prepared as outlined above, and then added to the biochip comprising a plurality of 
5 nucleic acid probes, under conditions that allow the formation of a hybridization complex. 

A variety of hybridization conditions may be used in the present invention, including 
high, moderate and low stringency conditions as outlined above. The assays are generally 
run under stringency conditions which allow formation of the label probe hybridization 
complex only in the presence of target. Stringency can be controlled by altering a step 

10 parameter that is a thermodynamic variable, including, but not limited to, temperature, 
formamide concentration, salt concentration, chaotropic salt concentration, pH, organic 
solvent concentration, etc. 

These parameters may also be used to control non-specific binding, as is generally 
outlined in U.S. Patent No. 5,681,697. Thus it may be desirable to perform certain steps at

1 5 higher stringency conditions to reduce non-specific binding. 

The reactions outlined herein may be accomplished in a variety of ways. Components 
of the reaction may be added simultaneously, or sequentially, in different orders, with 
preferred embodiments outlined below. In addition, the reaction may include a variety of 
other reagents. These include salts, buffers, neutral proteins, e.g., albumin, detergents, etc. 

20 which may be used to facilitate optimal hybridization and detection, and/or reduce non- 
specific or background interactions. Reagents that otherwise improve the efficiency of the 
assay, such as protease inhibitors, nuclease inhibitors, anti-microbial agents, etc., may also be 
used as appropriate, depending on the sample preparation methods and purity of the target. 
The assay data are analyzed to determine the expression levels, and changes in 

25 expression levels as between states, of individual genes, forming a gene expression profile. 

Screens are performed to identify modulators of the lung cancer phenotype. In one 
embodiment, screening is performed to identify modulators that can induce or suppress a 
particular expression profile, thus preferably generating the associated phenotype. In another 
embodiment, e.g., for diagnostic applications, having identified differentially expressed genes 

30 important in a particular state, screens can be performed to identify modulators that alter 

expression of individual genes. In another embodiment, screening is performed to identify
modulators that alter a biological function of the expression product of a differentially 
expressed gene. Again, having identified the importance of a gene in a particular state, 
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screens are performed to identify agents that bind and/or modulate the biological activity of 
the gene product, or evaluate genetic polymorphisms. 

Genes can be screened for those that are induced in response to a candidate agent. 
After identifying a modulator based upon its ability to suppress a lung cancer expression 
5 pattern leading to a normal expression pattern, or to modulate a single lung cancer gene 
expression profile so as to mimic the expression of the gene from normal tissue, a screen as 
described above can be performed to identify genes that are specifically modulated in 
response to the agent. Comparing expression profiles between normal tissue and agent 
treated lung cancer tissue reveals genes that are not expressed in normal tissue or lung cancer 

10 tissue, but are expressed in agent treated tissue. These agent-specific sequences can be
identified and used by methods described herein for lung cancer genes or proteins. In 
particular these sequences and the proteins they encode find use in marking or identifying 
agent treated cells. In addition, antibodies can be raised against the agent induced proteins 
and used to target novel therapeutics to the treated lung cancer tissue sample. 

15 Thus, in one embodiment, a test compound is administered to a population of lung 

cancer cells, that have an associated lung cancer expression profile. By "administration" or 
"contacting" herein is meant that the candidate agent is added to the cells in such a manner as 
to allow the agent to act upon the cell, whether by uptake and intracellular action, or by 
action at the cell surface. In some embodiments, nucleic acid encoding a proteinaceous 

20 candidate agent (i.e., a peptide) may be put into a viral construct such as an adenoviral or 
retroviral construct, and added to the cell, such that expression of the peptide agent is 

accomplished, e.g., PCT US97/01019. Regulatable gene therapy systems can also be used.

Once a test compound has been administered to the cells, the cells can be washed if 
desired and are allowed to incubate under preferably physiological conditions for some 
25 period of time. The cells are then harvested and a new gene expression profile is generated, 
as outlined herein. 

Thus, e.g., lung cancer or non-malignant tissue may be screened for agents that 
modulate, e.g., induce or suppress a lung cancer phenotype. A change in at least one gene, 
preferably many, of the expression profile indicates that the agent has an effect on lung 
30 cancer activity. By defining such a signature for the lung cancer phenotype, screens for new 
drugs that alter the phenotype can be devised. With this approach, the drug target need not be 
known and need not be represented in the original expression screening platform, nor does 
the level of transcript for the target protein need to change. 
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Measure of lung cancer polypeptide activity, or of lung cancer or the lung cancer 
phenotype can be performed using a variety of assays. For example, the effects of the test 
compounds upon the function of the metastatic polypeptides can be measured by examining 
parameters described above. A suitable physiological change that affects activity can be used 
5 to assess the influence of a test compound on the polypeptides of this invention. When the 
functional consequences are determined using intact cells or animals, one can also measure a 
variety of effects such as, in the case of lung cancer associated with tumors, tumor growth, 
tumor metastasis, neovascularization, hormone release, transcriptional changes to both known 
and uncharacterized genetic markers (e.g., northern blots), changes in cell metabolism such as 

10 cell growth or pH changes, and changes in intracellular second messengers such as cGMP. In 
the assays of the invention, mammalian lung cancer polypeptide is typically used, e.g., 
mouse, preferably human. 

Assays to identify compounds with modulating activity can be performed in vitro. 
For example, a lung cancer polypeptide is first contacted with a potential modulator and 

15 incubated for a suitable amount of time, e.g., from 0.5 to 48 hours. In one embodiment, the 
lung cancer polypeptide levels are determined in vitro by measuring the level of protein or 
mRNA. The level of protein is typically measured using immunoassays such as western 
blotting, ELISA and the like with an antibody that selectively binds to the lung cancer 
polypeptide or a fragment thereof. For measurement of mRNA, amplification, e.g., using 

20 PCR, LCR, or hybridization assays, e.g., northern hybridization, RNAse protection, dot

blotting, are preferred. The level of protein or mRNA is typically detected using directly or 
indirectly labeled detection agents, e.g., fluorescently or radioactively labeled nucleic acids, 
radioactively or enzymatically labeled antibodies, and the like, as described herein. 

Alternatively, a reporter gene system can be devised using a lung cancer protein 

25 promoter operably linked to a reporter gene such as luciferase, green fluorescent protein, 
CAT, or β-gal. The reporter construct is typically transfected into a cell. After treatment
with a potential modulator, the amount of reporter gene transcription, translation, or activity 
is measured according to standard techniques known to those of skill in the art. 

In a preferred embodiment, as outlined above, screens may be done on individual 

* 

30 genes and gene products (proteins). That is, having identified a particular differentially 

expressed gene as important in a particular state, screening of modulators of the expression of 
the gene or the gene product itself can be done. The gene products of differentially expressed 
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genes are sometimes referred to herein as "lung cancer proteins." The lung cancer protein 

may be a fragment, or alternatively, be the full length protein to a fragment shown herein.

In one embodiment, screening for modulators of expression of specific genes is 
performed. Typically, the expression of only one or a few genes is evaluated. In another
5 embodiment, screens are designed to first find compounds that bind to differentially 
expressed proteins. These compounds are then evaluated for the ability to modulate 
differentially expressed activity. Moreover, once initial candidate compounds are identified, 
variants can be further screened to better evaluate structure activity relationships. 

In a preferred embodiment, binding assays are done. In general, purified or isolated 
1 0 gene product is used; that is, the gene products of one or more differentially expressed 

nucleic acids are made. For example, antibodies are generated to the protein gene products, 
and standard immunoassays are run to determine the amount of protein present. Alternatively, 
cells comprising the lung cancer proteins can be used in the assays. 

Thus, in a preferred embodiment, the methods comprise combining a lung cancer 
1 5 protein and a candidate compound, and determining the binding of the compound to the lung 
cancer protein. Preferred embodiments utilize the human lung cancer protein, although other 
mammalian proteins may also be used, e.g., for the development of animal models of human 
disease. In some embodiments, as outlined herein, variant or derivative lung cancer proteins 
may be used. 

20 Generally, in a preferred embodiment of the methods herein, the lung cancer protein 

or the candidate agent is non-diffusably bound to an insoluble support, preferably having 
isolated sample receiving areas (e.g., a microtiter plate, an array, etc.). The insoluble 
supports may be made of any composition to which the compositions can be bound, that is readily
separated from soluble material, and is otherwise compatible with the overall method of 

25 screening. The surface of such supports may be solid or porous and of a convenient shape. 
Examples of suitable insoluble supports include microtiter plates, arrays, membranes and 
beads. These are typically made of glass, plastic (e.g., polystyrene), polysaccharides, nylon 
or nitrocellulose, teflon™, etc. Microtiter plates and arrays are especially convenient because 
a large number of assays can be carried out simultaneously, using small amounts of reagents 

30 and samples. The particular manner of binding of the composition is typically not crucial so 
long as it is compatible with the reagents and overall methods of the invention, maintains the 
activity of the composition, and is nondiffusable. Preferred methods of binding include the 
use of antibodies (which do not sterically block either the ligand binding site or activation 
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sequence when the protein is bound to the support), direct binding to "sticky" or ionic 
supports, chemical crosslinking, the synthesis of the protein or agent on the surface, etc. 
Following binding of the protein or agent, excess unbound material is removed by washing. 
The sample receiving areas may then be blocked through incubation with bovine serum 
albumin (BSA), casein or other innocuous protein or other moiety. 

In a preferred embodiment, the lung cancer protein is bound to the support, and a test 
compound is added to the assay. Alternatively, the candidate agent is bound to the support 
and the lung cancer protein is added. Novel binding agents include specific antibodies, non- 
natural binding agents identified in screens of chemical libraries, peptide analogs, etc. Of 
particular interest are screening assays for agents that have a low toxicity for human cells. A 
wide variety of assays may be used for this purpose, including labeled in vitro protein-protein 
binding assays, electrophoretic mobility shift assays, immunoassays for protein binding, 
functional assays (phosphorylation assays, etc.) and the like. 

The determination of the binding of the test modulating compound to the lung cancer 
protein may be done in a number of ways. In a preferred embodiment, the compound is 
labeled, and binding determined directly, e.g., by attaching all or a portion of the lung cancer 
protein to a solid support, adding a labeled candidate agent (e.g., a fluorescent label), washing 
off excess reagent, and determining whether the label is present on the solid support. Various 
blocking and washing steps may be utilized as appropriate. 

In some embodiments, only one of the components is labeled, e.g., the proteins (or 
proteinaceous candidate compounds) can be labeled. Alternatively, more than one 
component can be labeled with different labels, e.g., ¹²⁵I for the proteins and a fluorophor for
the compound. Proximity reagents, e.g., quenching or energy transfer reagents are also 
useful. 

In one embodiment, the binding of the test compound is determined by competitive 
binding assay. The competitor may be a binding moiety known to bind to the target molecule 
(i.e., a lung cancer protein), such as an antibody, peptide, binding partner, ligand, etc. Under 
certain circumstances, there may be competitive binding between the compound and the 
binding moiety, with the binding moiety displacing the compound. In one embodiment, the 
test compound is labeled. Either the compound, or the competitor, or both, is added first to 
the protein for a time sufficient to allow binding, if present. Incubations may be performed at 
a temperature which facilitates optimal activity, typically between 4 and 40° C. Incubation 
periods are typically optimized, e.g., to facilitate rapid high throughput screening. Typically 



65 



WO 02/086443 PCT/US02/12476 

between 0.1 and 1 hour will be sufficient. Excess reagent is generally removed or washed
away. The second component is then added, and the presence or absence of the labeled 
component is followed, to indicate binding. 

In a preferred embodiment, the competitor is added first, followed by a test 
5 compound. Displacement of the competitor is an indication that the test compound is binding 
to the lung cancer protein and thus is capable of binding to, and potentially modulating, the 
activity of the lung cancer protein. In this embodiment, either component can be labeled. 
Thus, e.g., if the competitor is labeled, the presence of label in the wash solution indicates 
displacement by the agent. Alternatively, if the test compound is labeled, the presence of the 

1 0 label on the support indicates displacement. 

In an alternative embodiment, the test compound is added first, with incubation and 
washing, followed by the competitor. The absence of binding by the competitor may indicate 
that the test compound is bound to the lung cancer protein with a higher affinity. Thus, if the 
test compound is labeled, the presence of the label on the support, coupled with a lack of

15 competitor binding, may indicate that the test compound is capable of binding to the lung 
cancer protein. 

In a preferred embodiment, the methods comprise differential screening to identify
agents that are capable of modulating the activity of the lung cancer proteins. In one 
embodiment, the methods comprise combining a lung cancer protein and a competitor in a 

20 first sample. A second sample comprises a test compound, a lung cancer protein, and a 

competitor. The binding of the competitor is determined for both samples, and a change, or 
difference in binding between the two samples indicates the presence of an agent capable of 
binding to the lung cancer protein and potentially modulating its activity. That is, if the 
binding of the competitor is different in the second sample relative to the first sample, the 

25 agent is capable of binding to the lung cancer protein. 

Alternatively, differential screening is used to identify drug candidates that bind to the 
native lung cancer protein, but cannot bind to modified lung cancer proteins. The structure of 
the lung cancer protein may be modeled, and used in rational drug design to synthesize agents 
that interact with that site. Drug candidates that affect the activity of a lung cancer protein 

30 are also identified by screening drugs for the ability to either enhance or reduce the activity of 
the protein. 

Positive controls and negative controls may be used in the assays. Preferably control 
and test samples are performed in at least triplicate to obtain statistically significant results. 
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Incubation of all samples is for a time sufficient for the binding of the agent to the protein. 
Following incubation, samples are washed free of non-specifically bound material and the 
amount of bound, generally labeled agent determined. For example, where a radiolabel is 
employed, the samples may be counted in a scintillation counter to determine the amount of 
5 bound compound. 

A variety of other reagents may be included in the screening assays. These include 
reagents like salts, neutral proteins, e.g., albumin, detergents, etc. which may be used to 
facilitate optimal protein-protein binding and/or reduce non-specific or background 
interactions. Also reagents that otherwise improve the efficiency of the assay, such as 
10 protease inhibitors, nuclease inhibitors, anti-microbial agents, etc., may be used. The mixture 
of components may be added in an order that provides for the requisite binding. 

In a preferred embodiment, the invention provides methods for screening for a 
compound capable of modulating the activity of a lung cancer protein. The methods 
comprise adding a test compound, as defined above, to a cell comprising lung cancer 
15 proteins. Preferred cell types include almost any cell. The cells contain a recombinant 
nucleic acid that encodes a lung cancer protein. In a preferred embodiment, a library of 
candidate agents is tested on a plurality of cells.

In one aspect, the assays are evaluated in the presence or absence or previous or 
subsequent exposure of physiological signals, e.g., hormones, antibodies, peptides, antigens, 
20 cytokines, growth factors, action potentials, pharmacological agents including 

chemotherapeutics, radiation, carcinogenics, or other cells (e.g., cell-cell contacts). In another 
example, the determinations are made at different stages of the cell cycle process.

In this way, compounds that modulate lung cancer agents are identified. Compounds 
with pharmacological activity are able to enhance or interfere with the activity of the lung 
25 cancer protein. Once identified, similar structures are evaluated to identify critical structural 
features of the compound.

In one embodiment, a method of inhibiting lung cancer cell division is provided. The 
method comprises administration of a lung cancer inhibitor. In another embodiment, a 
method of inhibiting lung cancer is provided. The method may comprise administration of a 
30 lung cancer inhibitor. In a further embodiment, methods of treating cells or individuals with 
lung cancer are provided, e.g., comprising administration of a lung cancer inhibitor. 

In one embodiment, a lung cancer inhibitor is an antibody as discussed above. In 
another embodiment, the lung cancer inhibitor is an antisense molecule. 
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A variety of cell growth, proliferation, viability, and metastasis assays are known to 
those of skill in the art, as described below. 



Soft agar growth or colony formation in suspension 
5 Normal cells require a solid substrate to attach and grow. When the cells are 

transformed, they lose this phenotype and grow detached from the substrate. For example, 
transformed cells can grow in stirred suspension culture or suspended in semi-solid media, 
such as semi-solid or soft agar. The transformed cells, when transfected with tumor 
suppressor genes, regenerate normal phenotype and require a solid substrate to attach and 

10 grow. Soft agar growth or colony formation in suspension assays can be used to identify 
modulators of lung cancer sequences, which when expressed in host cells, inhibit abnormal 
cellular proliferation and transformation. A therapeutic compound would reduce or eliminate 
the host cells' ability to grow in stirred suspension culture or suspended in semi-solid media, 
such as semi-solid or soft agar.

1 5 Techniques for soft agar growth or colony formation in suspension assays are 

described in Freshney (1994) Culture of Animal Cells: A Manual of Basic Technique (3rd ed.),
herein incorporated by reference. See also, the methods section of Garkavtsev, et al. (1996), 
supra, herein incorporated by reference. 



20 Contact inhibition and density limitation of growth 

Normal cells typically grow in a flat and organized pattern in a petri dish until they 
touch other cells. When the cells touch one another, they are contact inhibited and stop 
growing. When cells are transformed, however, the cells are not contact inhibited and 
continue to grow to high densities in disorganized foci. Thus, the transformed cells grow to a 

25 higher saturation density than normal cells. This can be detected morphologically by the 
formation of a disoriented monolayer of cells or rounded cells in foci within the regular 
pattern of normal surrounding cells. Alternatively, labeling index with (³H)-thymidine at
saturation density can be used to measure density limitation of growth. See Freshney (1994), 
supra. The transformed cells, when transfected with tumor suppressor genes, regenerate a 

30 normal phenotype and become contact inhibited and would grow to a lower density. 

In this assay, labeling index with (³H)-thymidine at saturation density is a preferred
method of measuring density limitation of growth. Transformed host cells are transfected 
with a lung cancer-associated sequence and are grown for 24 hours at saturation density in 
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non-limiting medium conditions. The percentage of cells labeling with ( H)-thymidine is 
determined autoradiographically. See, Freshney (1994), supra. 

Growth factor or serum dependence 

Transformed cells typically have a lower serum dependence than their normal 
counterparts (see, e.g., Temin (1966) J. Natl. Cancer Inst. 37:167-175; Eagle, et al. (1970) J.
Exp. Med. 131:836-879); Freshney, supra. This is in part due to release of various growth
factors by the transformed cells. Growth factor or serum dependence of transformed host 
cells can be compared with that of control. 

Tumor specific markers levels 

Tumor cells release an increased amount of certain factors (hereinafter "tumor 
specific markers") than their normal counterparts. For example, plasminogen activator (PA) 
is released from human glioma at a higher level than from normal brain cells (see, e.g., 
Gullino, "Angiogenesis, tumor vascularization, and potential interference with tumor growth"
in Mihich (ed. 1985) Biological Responses in Cancer, pp. 178-184). Similarly, Tumor
angiogenesis factor (TAF) is released at a higher level in tumor cells than their normal
counterparts. See, e.g., Folkman (1992) "Angiogenesis and Cancer" in Sem. Cancer Biol.

Various techniques which measure the release of these factors are described in 
Freshney (1994), supra. Also, see, Unkeless, et al. (1974) J. Biol. Chem. 249:4295-4305; 
Strickland and Beers (1976) J. Biol. Chem. 251:5694-5702; Whur, et al. (1980) Br. J. Cancer
42:305-312; Gullino, "Angiogenesis, tumor vascularization, and potential interference with
tumor growth" in Mihich (ed. 1985) Biological Responses in Cancer, pp. 178-184; Freshney
Anticancer Res. 5:111-130 (1985). 

Invasiveness into Matrigel 

The degree of invasiveness into Matrigel or some other extracellular matrix 
constituent can be used as an assay to identify compounds that modulate lung cancer- 
associated sequences. Tumor cells exhibit a good correlation between malignancy and 
invasiveness of cells into Matrigel or some other extracellular matrix constituent. In this 
assay, tumorigenic cells are typically used as host cells. Expression of a tumor suppressor 
gene in these host cells would decrease invasiveness of the host cells. 
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Techniques described in Freshney (1994), supra, can be used. Briefly, the level of 
invasion of host cells can be measured by using filters coated with Matrigel or some other 
extracellular matrix constituent. Penetration into the gel, or through to the distal side of the 
filter, is rated as invasiveness, and rated histologically by number of cells and distance 
5 moved, or by prelabeling the cells with ¹²⁵I and counting the radioactivity on the distal side of
the filter or bottom of the dish. See, e.g., Freshney (1984), supra. 



Tumor growth in vivo 

Effects of lung cancer-associated sequences on cell growth can be tested in transgenic 

10 or immune-suppressed mice. Knock-out transgenic mice can be made, in which the lung 
cancer gene is disrupted or in which a lung cancer gene is inserted. Knock-out transgenic 
mice can be made by insertion of a marker gene or other heterologous gene into the 
endogenous lung cancer gene site in the mouse genome via homologous recombination. 
Such mice can also be made by substituting the endogenous lung cancer gene with a mutated 

15 version of the lung cancer gene, or by mutating the endogenous lung cancer gene, e.g., by 
exposure to carcinogens. 

A DNA construct is introduced into the nuclei of embryonic stem cells. Cells 
containing the newly engineered genetic lesion are injected into a host mouse embryo, which 
is re-implanted into a recipient female. Some of these embryos develop into chimeric mice 

20 that possess germ cells partially derived from the mutant cell line. Therefore, by breeding the 
chimeric mice it is possible to obtain a new line of mice containing the introduced genetic 
lesion (see, e.g., Capecchi, et al. (1989) Science 244:1288). Chimeric targeted mice can be 
derived according to Hogan, et al. (1988) Manipulating the Mouse Embryo: A Laboratory
Manual, Cold Spring Harbor Laboratory and Robertson (ed. 1987) Teratocarcinomas and

25 Embryonic Stem Cells: A Practical Approach, IRL Press, Washington, D.C.

Alternatively, various immune-suppressed or immune-deficient host animals can be 
used. For example, genetically athymic "nude" mouse (see, e.g., Giovanella, et al. (1974) J. 
Natl. Cancer Inst. 52:921), a SCID mouse, a thymectomized mouse, or an irradiated mouse 
(see, e.g., Bradley, et al. (1978) Br. J. Cancer 38:263; Selby, et al. (1980) Br. J. Cancer 41:52) 

30 can be used as a host. Transplantable tumor cells (typically about 10⁶ cells) injected into

isogenic hosts will produce invasive tumors in a high proportion of cases, while normal cells
of similar origin will not. In hosts which developed invasive tumors, cells expressing a lung
cancer-associated sequence are injected subcutaneously. After a suitable length of time,
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preferably 4-8 weeks, tumor growth is measured (e.g., by volume or by its two largest 
dimensions) and compared to the control. Tumors that have statistically significant reduction 
(using, e.g., Student's T test) are said to have inhibited growth. 

5 Polynucleotide modulators of lung cancer 

Antisense and RNAi Polynucleotides 

In certain embodiments, the activity of a lung cancer-associated protein is 
downregulated, or entirely inhibited, by the use of antisense or an inhibitory polynucleotide, 
i.e., a nucleic acid complementary to, and which can preferably hybridize specifically to, a 

10 coding mRNA nucleic acid sequence, e.g., a lung cancer protein mRNA, or a subsequence 
thereof. Binding of the antisense polynucleotide to the mRNA reduces the translation and/or 
stability of the mRNA. 

In the context of this invention, antisense polynucleotides can comprise naturally- 
occurring nucleotides, or synthetic species formed from naturally-occurring subunits or their 

1 5 close homologs. Antisense polynucleotides may also have altered sugar moieties or inter- 
sugar linkages. Exemplary among these are the phosphorothioate and other sulfur containing 
species which are known for use in the art. Analogs are comprehended by this invention so 
long as they function effectively to hybridize with the lung cancer protein mRNA. See, e.g., 
Isis Pharmaceuticals, Carlsbad, CA; Sequitor, Inc., Natick, MA. 

20 Such antisense polynucleotides can readily be synthesized using recombinant means, 

or can be synthesized in vitro. Equipment for such synthesis is sold by several vendors, 
including Applied Biosystems. The preparation of other oligonucleotides such as 
phosphorothioates and alkylated derivatives is also well known to those of skill in the art. 
Antisense molecules as used herein include antisense or sense oligonucleotides. 

25 Sense oligonucleotides can, e.g., be employed to block transcription by binding to the anti- 
sense strand. The antisense and sense oligonucleotide comprise a single-stranded nucleic 
acid sequence (either RNA or DNA) capable of binding to target mRNA (sense) or DNA 
(antisense) sequences for lung cancer molecules. A preferred antisense molecule is for a lung 
cancer sequence in the tables, or for a ligand or activator thereof. Antisense or sense 

30 oligonucleotides, according to the present invention, comprise a fragment generally at least 
about 14 nucleotides, preferably from about 14 to 30 nucleotides. The ability to derive an 
antisense or a sense oligonucleotide, based upon a cDNA sequence encoding a given protein 
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is described in, e.g., Stein and Cohen (1988) Cancer Res. 48:2659 and van der Krol, et al. 
(1988) BioTechniques 6:958). 

RNA interference is a mechanism to suppress gene expression in a sequence specific 
manner. See, e.g., Brummelkamp, et al. (2002) Sciencexpress (21 March 2002); Sharp (1999) 
Genes Dev. 13:139-141; and Carthew (2001) Curr. Op. Cell Biol. 13:244-248. In mammalian 
cells, short, e.g., 21 nt, double stranded small interfering RNAs (siRNA) have been shown to 
be effective at inducing an RNAi response. See, e.g., Elbashir, et al. (2001) Nature 411:494- 
498. The mechanism may be used to downregulate expression levels of identified genes, e.g., 
treatment of or validation of relevance to disease. 



Ribozymes 

In addition to antisense polynucleotides, ribozymes can be used to target and inhibit 
transcription of lung cancer-associated nucleotide sequences. A ribozyme is an RNA 
molecule that catalytically cleaves other RNA molecules. Different kinds of ribozymes have 

15 been described, including group I ribozymes, hammerhead ribozymes, hairpin ribozymes, 
RNase P, and axehead ribozymes (see, e.g., Castanotto, et al. (1994) Adv. in Pharmacology 
25: 289-317 for a general review of the properties of different ribozymes). 

The general features of hairpin ribozymes are described, e.g., in Hampel, et al. (1990) 
Nucl. Acids Res. 18:299-304; European Patent Publication No. 0 360 257; U.S. Patent No. 

20 5,254,678. Methods of preparing are well known to those of skill in the art (see, e.g., WO 
94/26877; Ojwang, et al. (1993) Proc. Natl. Acad. Sci. USA 90:6340-6344; Yamada, et al. 
(1994) Human Gene Therapy 1:39-45; Leavitt, et al. (1995) Proc. Natl. Acad. Sci. USA 
92:699-703; Leavitt, et al. (1994) Human Gene Therapy 5:1151-120; and Yamada, et al. 
(1994) Virology 205: 121-126). 

25 Polynucleotide modulators of lung cancer may be introduced into a cell containing the 

target nucleotide sequence by formation of a conjugate with a ligand binding molecule, as 
described in WO 91/04753. Suitable ligand binding molecules include, but are not limited to, 
cell surface receptors, growth factors, other cytokines, or other ligands that bind to cell 
surface receptors. Preferably, conjugation of the ligand binding molecule does not 

30 substantially interfere with the ability of the ligand binding molecule to bind to its 

corresponding molecule or receptor, or block entry of the sense or antisense oligonucleotide 
or its conjugated version into the cell. Alternatively, a polynucleotide modulator of lung 
cancer may be introduced into a cell containing the target nucleic acid sequence, e.g., by 
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formation of an polynucleotide-lipid complex, as described in WO 90/10448. It is 
understood that the use of antisense molecules or knock out and knock in models may also be 
used in screening assays as discussed above, in addition to methods of treatment. 

Thus, in one embodiment, methods of modulating lung cancer in cells or organisms 

m 

are provided. In one embodiment, the methods comprise administering to a cell an anti-lung 
cancer antibody that reduces or eliminates the biological activity of an endogenous lung 
cancer protein. Alternatively, the methods comprise administering to a cell or organism a 
recombinant nucleic acid encoding a lung cancer protein. This may be accomplished in any 
number of ways. In a preferred embodiment, e.g., when the lung cancer sequence is down- 
regulated in lung cancer, such state may be reversed by increasing the amount of lung cancer 
gene product in the cell. This can be accomplished, e.g., by overexpressing the endogenous 
lung cancer gene or administering a gene encoding the lung cancer sequence, using known 
gene-therapy techniques. In a preferred embodiment, the gene therapy techniques include the 
incorporation of the exogenous gene using enhanced homologous recombination (EHR), e.g., 
as described in PCT/US93/03868, hereby incorporated by reference in its entirety. 
Alternatively, e.g., when the lung cancer sequence is up-regulated in lung cancer, the activity 
of the endogenous lung cancer gene is decreased, e.g., by the administration of a lung cancer 
antisense or RNAi nucleic acid. 

In one embodiment, the lung cancer proteins of the present invention may be used to 
generate polyclonal and monoclonal antibodies to lung cancer proteins. Similarly, the lung 
cancer proteins can be coupled, using standard technology, to affinity chromatography 
columns. These columns may then be used to purify lung cancer antibodies useful for 
production, diagnostic, or therapeutic purposes. In a preferred embodiment, the antibodies 
are generated to epitopes unique to a lung cancer protein; that is, the antibodies show little or 
no cross-reactivity to other proteins. The lung cancer antibodies may be coupled to standard 
affinity chromatography columns and used to purify lung cancer proteins. The antibodies 
may also be used as blocking polypeptides, as outlined above, since they will specifically 
bind to the lung cancer protein. 

Methods of identifying variant lung cancer-associated sequences 

Without being bound by theory, expression of various lung cancer sequences is 
correlated with lung cancer. Accordingly, disorders based on mutant or variant lung cancer 
genes may be determined. In one embodiment, the invention provides methods for 
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identifying cells containing variant lung cancer genes, e.g., determining all or part of the 
sequence of at least one endogenous lung cancer gene in a cell. In a preferred embodiment, 
the invention provides methods of identifying the lung cancer genotype of an individual, e.g., 
determining all or part of the sequence of at least one lung cancer gene of the individual. 
This is generally done in at least one tissue of the individual, and may include the evaluation 
of a number of tissues or different samples of the same tissue. The method may include 
comparing the sequence of the sequenced lung cancer gene to a known lung cancer gene, i.e., 
a wild-type gene. 

The sequence of all or part of the lung cancer gene can then be compared to the 
sequence of a known lung cancer gene to determine if any differences exist. This can be 
done using known homology programs, such as Bestfit, etc. In a preferred embodiment, the 
presence of a difference in the sequence between the lung cancer gene of the patient and the 
known lung cancer gene correlates with a disease state or a propensity for a disease state, as 
outlined herein. 

In a preferred embodiment, the lung cancer genes are used as probes to determine the 
number of copies of the lung cancer gene in the genome. 

In another preferred embodiment, the lung cancer genes are used as probes to 
determine the chromosomal localization of the lung cancer genes. Information such as 
chromosomal localization finds use in providing a diagnosis or prognosis in particular when 
chromosomal abnormalities such as translocations, and the like are identified in the lung 
cancer gene locus. 

Administration of pharmaceutical and vaccine compositions 

In one embodiment, a therapeutically effective dose of a lung cancer protein or 
modulator thereof, is administered to a patient. By "therapeutically effective dose" herein is 
meant a dose that produces effects for which it is administered. The exact dose will depend 
on the purpose of the treatment, and will be ascertainable by one skilled in the art using 
known techniques (e.g., Ansel, et al. (1992) Pharmaceutical Dosage Forms and Drug 
Delivery; Lieberman, Pharmaceutical Dosage Forms (vols. 1-3), Dekker, ISBN 0824770846, 
082476918X, 0824712692, 0824716981; Lloyd (1999) The Art, Science and Technology of 
Pharmaceutical Compounding; and Pickar (1999) Dosage Calculations). Adjustments for 
lung cancer degradation, systemic versus localized delivery, and rate of new protease 
synthesis, as well as the age, body weight, general health, sex, diet, time of administration, 
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drug interaction and the severity of the condition may be necessary, and will be ascertainable 
with routine experimentation by those skilled in the art. 

A "patient" for the purposes of the present invention includes both humans and other 
animals, particularly mammals. Thus the methods are applicable to both human therapy and 
5 veterinary applications. In the preferred embodiment the patient is a mammal, preferably a 
primate, and in the most preferred embodiment the patient is human. 

The administration of the lung cancer proteins and modulators thereof of the present 
invention can be done in a variety of ways, including, but not limited to, orally, 
subcutaneously, intravenously, intranasally, transdermally, intraperitoneally, intramuscularly, 

10 intrapulmonary, vaginally, rectally, or intraocularly. In some instances, e.g., in the treatment 
of wounds and inflammation, the lung cancer proteins and modulators may be directly 
applied as a solution or spray. 

The pharmaceutical compositions of the present invention comprise a lung cancer 
protein in a form suitable for administration to a patient. In the preferred embodiment, the 

15 pharmaceutical compositions are in a water soluble form, such as being present as 

pharmaceutically acceptable salts, which is meant to include both acid and base addition 
salts. "Pharmaceutically acceptable acid addition salt" refers to those salts that retain the 
biological effectiveness of the free bases and that are not biologically or otherwise 
undesirable, formed with inorganic acids such as hydrochloric acid, hydrobromic acid, 

20 sulfuric acid, nitric acid, phosphoric acid and the like, and organic acids such as acetic acid, 
propionic acid, glycolic acid, pyruvic acid, oxalic acid, maleic acid, malonic acid, succinic 
acid, fumaric acid, tartaric acid, citric acid, benzoic acid, cinnamic acid, mandelic acid, 
methanesulfonic acid, ethanesulfonic acid, p-toluenesulfonic acid, salicylic acid and the like. 
"Pharmaceutically acceptable base addition salts" include those derived from inorganic bases 

25 such as sodium, potassium, lithium, ammonium, calcium, magnesium, iron, zinc, copper, 
manganese, aluminum salts and the like. Particularly preferred are the ammonium, 
potassium, sodium, calcium, and magnesium salts. Salts derived from pharmaceutically 
acceptable organic non-toxic bases include salts of primary, secondary, and tertiary amines, 
substituted amines including naturally occurring substituted amines, cyclic amines and basic 

30 ion exchange resins, such as isopropylamine, trimethylamine, diethylamine, triethylamine, 
tripropylamine, and ethanolamine. 

The pharmaceutical compositions may also include one or more of the following: 
carrier proteins such as serum albumin; buffers; fillers such as microcrystalline cellulose, 

75 



WO 02/086443 PCT/US02/12476 

lactose, corn and other starches; binding agents; sweeteners and other flavoring agents; 
coloring agents; and polyethylene glycol. 

The pharmaceutical compositions can be administered in a variety of unit dosage 
forms depending upon the method of administration. For example, unit dosage forms 
5 suitable for oral administration include, but are not limited to, powder, tablets, pills, capsules 
and lozenges. It is recognized that lung cancer protein modulators (e.g., antibodies, antisense 
constructs, ribozymes, small organic molecules, etc.) when administered orally, should be 
protected from digestion. This is typically accomplished either by complexing the 
molecule(s) with a composition to render it resistant to acidic and enzymatic hydrolysis, or by 

10 packaging the molecule(s) in an appropriately resistant carrier, such as a liposome or a 
protection barrier. Means of protecting agents from digestion are well known in the art. 

The compositions for administration will commonly comprise a lung cancer protein 
modulator dissolved in a pharmaceutically acceptable carrier, preferably an aqueous carrier. 
A variety of aqueous carriers can be used, e.g., buffered saline and the like. These solutions 

15 are sterile and generally free of undesirable matter. These compositions may be sterilized by 
conventional, well known sterilization techniques. The compositions may contain 
pharmaceutically acceptable auxiliary substances as required to approximate physiological 
conditions such as pH adjusting and buffering agents, toxicity adjusting agents and the like, 
e.g., sodium acetate, sodium chloride, potassium chloride, calcium chloride, sodium lactate 

20 and the like. The concentration of active agent in these formulations can vary widely, and 
will be selected primarily based on fluid volumes, viscosities, body weight and the like in 
accordance with the particular mode of administration selected and the patient's needs (e.g., 
Remington's Pharmaceutical Science (15th ed., 1980) and Hardman, et al. (eds. 1996) 
Goodman and Gilman: The Pharmacological Basis of Therapeutics). 

25 Thus, a typical pharmaceutical composition for intravenous administration would be 

about 0.1 to 10 mg per patient per day. Dosages from 0.1 up to about 100 mg per patient per 
day may be used, particularly when the drug is administered to a secluded site and not into 
the blood stream, such as into a body cavity or into a lumen of an organ. Substantially higher 
dosages are possible in topical administration. Actual methods for preparing parenterally 

30 administrable compositions will be known or apparent to those skilled in the art, e.g., 

Remington's Pharmaceutical Science and Goodman and Gilman, The Pharmacological Basis 
of Therapeutics, supra. 
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The compositions containing modulators of lung cancer proteins can be administered 
for therapeutic or prophylactic treatments. In therapeutic applications, compositions are 
administered to a patient suffering from a disease (e.g., a cancer) in an amount sufficient to 
cure or at least partially arrest the disease and its complications. An amount adequate to 
5 accomplish this is defined as a "therapeutically effective dose." Amounts effective for this 
use will depend upon the severity of the disease and the general state of the patient's health. 
Single or multiple administrations of the compositions may be administered depending on the 
dosage and frequency as required and tolerated by the patient. In any event, the composition 
should provide a sufficient quantity of the agents of this invention to effectively treat the 

10 patient. An amount of modulator that is capable of preventing or slowing the development of 
cancer in a mammal is referred to as a "prophylactically effective dose." The particular dose 
required for a prophylactic treatment will depend upon the medical condition and history of 
the mammal, the particular cancer being prevented, as well as other factors such as age, 
weight, gender, administration route, efficiency, etc. Such prophylactic treatments may be 

1 5 used, e.g., in a mammal who has previously had cancer to prevent a recurrence of the cancer, 
or in a mammal who is suspected of having a significant likelihood of developing cancer 
based, at least in part, upon gene expression profiles. Vaccine strategies may be used, in 
either a DNA vaccine form, or protein vaccine. 

It will be appreciated that the present lung cancer protein-modulating compounds can 

20 be administered alone or in combination with additional lung cancer modulating compounds 
or with other therapeutic agents, e.g., other anti-cancer agents or treatments. 

In numerous embodiments, one or more nucleic acids, e.g., polynucleotides 
comprising nucleic acid sequences set forth in the tables, such as antisense or RNAi 
polynucleotides or ribozymes, will be introduced into cells, in vitro or in vivo. The present 

25 invention provides methods, reagents, vectors, and cells useful for expression of lung cancer- 
associated polypeptides and nucleic acids using in vitro (cell-free), ex vivo, or in vivo (cell or 
organism-based) recombinant expression systems. 

The particular procedure used to introduce the nucleic acids into a host cell for 
expression of a protein or nucleic acid is application specific. Many procedures for 

30 introducing foreign nucleotide sequences into host cells may be used. These include the use 
of calcium phosphate transfection, spheroplasts, electroporation, liposomes, microinjection, 
plasmid vectors, viral vectors and other well known methods for introducing cloned genomic 
DNA, cDNA, synthetic DNA or other foreign genetic material into a host cell (see, e.g., 
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Berger and Kinimel, Guide to Molecular Cloning Techniques, Methods in Enzvmology 
volume 152 (Berger), Ausubel, et al. (eds. 1999) Current Protocols (supplemented through 
1999), and Sambrook, et al. (1989) Molecular Cloning - A Laboratory Manual (2nd ed., Vol. 
1-3). 

5 In a preferred embodiment, lung cancer proteins and modulators are administered as 

therapeutic agents, and can be formulated as outlined above. Similarly, lung cancer genes 
(including both the full-length sequence, partial sequences, or regulatory sequences of the 
lung cancer coding regions) can be administered in a gene therapy application. These lung 
cancer genes can include antisense or inhibitory applications, e.g., as inhibitory RNA or gene 

10 therapy (e.g., for incorporation into the genome) or as antisense compositions. 

Lung cancer polypeptides and polynucleotides can also be administered as vaccine 
compositions to stimulate HTL, CTL, and antibody responses. Such vaccine compositions 
can include, e.g., lipidated peptides (see, e.g., Vitiello, et al. (1995) J. Clin. Invest. 95:341), 
peptide compositions encapsulated in poly(DL-lactide-co-glycolide) ("PLG") microspheres 

15 (see, e.g., Eldridge, et al. (1991) Molec. Immunol. 28:287-294; Alonso, et al. (1994) Vaccine 
12:299-306; Jones, et al. (1995) Vaccine 13:675-681), peptide compositions contained in 
immune stimulating complexes (ISCOMS) (see, e.g., Takahashi, et al. (1990) Nature 
344:873-875; Hu, et al. (1998) Clin Exp Immunol. 113:235-243), multiple antigen peptide 
systems (MAPs) (see, e.g., Tam (1988) Proc. Natl. Acad. Sci. U.S.A. 85:5409-5413; Tam 

20 (1996) J. Immunol. Methods 196: 17-32), peptides formulated as multivalent peptides; 

peptides for use in ballistic delivery systems, typically crystallized peptides, viral delivery 
vectors (Perkus, et al., p. 379 In: Kaufmann (ed. 1996) Concepts in vaccine development; 
Chakrabarti, et al. (1986) Nature 320:535; Hu, et al. (1986) Nature 320:537; Kieny, et al. 
(1986) AIDS Bio/Technology 4:790; Top, et al. (1971) J. Infect. Dis. 124:148; Chanda, et al. 

25 (1990) Virology 175:535), particles of viral or synthetic origin (see, e.g., Kofler, et al. (1996) 
J. Immunol. Methods 192:25; Eldridge, et al. (1993) Sem. Hematol. 30:16; Falo, et al. (1995) 
Nature Med. 7:649), adjuvants (Warren, et al. (1986) Annu. Rev. Immunol. 4:369; Gupta, et 
al. (1993) Vaccine 11:293), liposomes (Reddy, et al. (1992) J. Immunol. 148:1585; Rock 
(1996) Immunol. Today 17:131), or, naked or particle absorbed cDNA (Ulmer, et al. (1993) 

30 Science 259:1745; Robinson, et al. (1993) Vaccine 11:957; Shiver, et al., p. 423 In: 

Kaufmann (ed. 1996) Concepts in vaccine development; Cease and Berzofsky (1994) Annu. 
Rev. Immunol. 12:923 and Eldridge, et al. (1993) Sem. Hematol. 30:16). Toxin-targeted 
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delivery technologies, also known as receptor mediated targeting, such as those of Avant 
Immunotherapeutics, Inc. (Needham, Massachusetts) may also be used. 

Vaccine compositions often include adjuvants. Many adjuvants contain a substance 
designed to protect the antigen from rapid catabolism, such as aluminum hydroxide or 
mineral oil, and a stimulator of immune responses, such as lipid A, Bordetella pertussis or 
Mycobacterium tuberculosis derived proteins. Certain adjuvants are commercially available 
as, e.g., Freund's Incomplete Adjuvant and Complete Adjuvant (Difco Laboratories, Detroit, 
MI); Merck Adjuvant 65 (Merck and Company, Inc., Rahway, NJ); AS-2 (SmithKline 
Beecham, Philadelphia, PA); aluminum salts such as aluminum hydroxide gel (alum) or 
aluminum phosphate; salts of calcium, iron or zinc; an insoluble suspension of acylated 
tyrosine; acylated sugars; cationically or anionically derivatized polysaccharides; 
polyphosphazenes; biodegradable microspheres; monophosphoryl lipid A and quil A. 
Cytokines, such as GM-CSF, interleukin-2, -7, -12, and other like growth factors, may also be 
used as adjuvants. 

Vaccines can be administered as nucleic acid compositions wherein DNA or RNA 
encoding one or more of the polypeptides, or a fragment thereof, is administered to a patient. 
This approach is described, for instance, in Wolff, et al. (1990) Science 247:1465 as well as 
U.S. Patent Nos. 5,580,859; 5,589,466; 5,804,566; 5,739,118; 5,736,524; 5,679,647; WO 
98/04720; and in more detail below. Examples of DNA-based delivery technologies include 
"naked DNA", facilitated (bupivacaine, polymers, peptide-mediated) delivery, cationic lipid 
complexes, and particle-mediated ("gene gun") or pressure-mediated delivery (see, e.g., U.S. 
Patent No. 5,922,687). 

For therapeutic or prophylactic immunization purposes, the peptides of the invention 
can be expressed by viral or bacterial vectors. Examples of expression vectors include 
attenuated viral hosts, such as vaccinia or fowlpox. This approach involves the use of 
vaccinia virus, e.g., as a vector to express nucleotide sequences that encode lung cancer 
polypeptides or polypeptide fragments. Upon introduction into a host, the recombinant 
vaccinia virus expresses the immunogenic peptide, and thereby elicits an immune response. 
Vaccinia vectors and methods useful in immunization protocols are described in, e.g., U.S. 
Patent No. 4,722,848. Another vector is BCG (Bacille Calmette Guerin). BCG vectors are 
described in Stover, et al. (1991) Nature 351:456-460. A wide variety of other vectors useful 
for therapeutic administration or immunization, e.g., adeno and adeno-associated virus 
vectors, retroviral vectors, Salmonella typhi vectors, detoxified anthrax toxin vectors, and the 
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like, will be apparent to those skilled in the art from the description herein (see, e.g., Shata, et 
al. (2000) Mol Med Today 6:66-71; Shedlock, et al. (2000) J. Leukoc. Biol. 68:793-806; 
Hipp, et al. (2000) In Vivo 14:571-85). 

Methods for the use of genes as DNA vaccines are well known, and include placing a 
5 lung cancer gene or portion of a lung cancer gene under the control of a regulatable promoter 
or a tissue-specific promoter for expression in a lung cancer patient. The lung cancer gene 
used for DNA vaccines can encode full-length lung cancer proteins, but more preferably 
encodes portions of the lung cancer proteins including peptides derived from the lung cancer 
protein. In one embodiment, a patient is immunized with a DNA vaccine comprising a 

10 plurality of nucleotide sequences derived from a lung cancer gene. For example, lung cancer- 
associated genes or sequences encoding subfragments of a lung cancer protein are introduced 
into expression vectors and tested for their immunogenicity in the context of Class I MHC 
and an ability to generate cytotoxic T cell responses. This procedure provides for production 
of cytotoxic T cell responses against cells which present antigen, including intracellular 

15 epitopes. 

In a preferred embodiment, DNA vaccines include a gene encoding an adjuvant 
molecule with the DNA vaccine. Such adjuvant molecules include cytokines that increase 
the immunogenic response to the lung cancer polypeptide encoded by the DNA vaccine. 
Additional or alternative adjuvants are available. 

20 In another preferred embodiment lung cancer genes find use in generating animal 

models of lung cancer. When the lung cancer gene identified is repressed or diminished in 
metastatic tissue, gene therapy technology, e.g., antisense or inhibitory RNA directed 
to the lung cancer gene, will also diminish or repress expression of the gene. Animal models 
of lung cancer find use in screening for modulators of a lung cancer-associated sequence or 

25 modulators of lung cancer. Similarly, transgenic animal technology including gene knockout 
technology, e.g., as a result of homologous recombination with an appropriate gene targeting 
vector, will result in the absence or increased expression of the lung cancer protein. When 
desired, tissue-specific expression or knockout of the lung cancer protein may be necessary. 
It is also possible that the lung cancer protein is overexpressed in lung cancer. As 

30 such, transgenic animals can be generated that overexpress the lung cancer protein. 

Depending on the desired expression level, promoters of various strengths can be employed 
to express the transgene. Also, the number of copies of the integrated transgene can be 
determined and compared for a determination of the expression level of the transgene. 
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Animals generated by such methods will find use as animal models of lung cancer and are 
additionally useful in screening for modulators to treat lung cancer. 



Kits for Use in Diagnostic and/or Prognostic Applications 

For use in diagnostic, research, and therapeutic applications suggested above, kits are 
also provided by the invention. In diagnostic and research applications such kits may include 
at least one of the following: assay reagents, buffers, lung cancer-specific nucleic acids or 
antibodies, hybridization probes and/or primers, antisense polynucleotides, ribozymes, RNAi, 
dominant negative lung cancer polypeptides or polynucleotides, small molecule inhibitors of 
lung cancer-associated sequences, etc. A therapeutic product may include sterile saline or 
another pharmaceutically acceptable emulsion and suspension base. 

In addition, the kits may include instructional materials containing instructions (e.g., 
protocols) for the practice of the methods of this invention. While the instructional materials 
typically comprise written or printed materials they are not limited to such. A medium 
capable of storing such instructions and communicating them to an end user is contemplated 
by this invention. Such media include, but are not limited to electronic storage media (e.g., 
magnetic discs, tapes, cartridges, chips), optical media (e.g., CD ROM), and the like. Such 
media may include addresses to internet sites that provide such instructional materials. 

The present invention also provides for kits for screening for modulators of lung 
cancer-associated sequences. Such kits can be prepared from readily available materials and 
reagents. For example, such kits can comprise one or more of the following materials: a lung 
cancer-associated polypeptide or polynucleotide, reaction tubes, and instructions for testing 
lung cancer-associated activity. Optionally, the kit contains biologically active lung cancer 
protein. A wide variety of kits and components can be prepared according to the present 
invention, depending upon the intended user of the kit and the particular needs of the user. 
Diagnosis would typically involve evaluation of a plurality of genes or products. The genes 
typically will be selected based on correlations with important parameters in disease which 
may be identified in historical or outcome data. 
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Example 1 : Gene Chip Analysis 

Molecular profiles of various normal and cancerous tissues were determined and 
5 analyzed using gene chips. RNA was isolated and gene chip analysis was performed as 

described (Glynne, et al. (2000) Nature 403:672-676; Zhao, et al. (2000) Genes Dev. 14:981- 
993). 



82 



WO 02/086443 



PCT/US02/12476 



Tables 1A and 1B were previously filed on April 18, 2001 in USSN 60/284,770 (18501-001800US) and on November 29, 2001 in USSN 60/334,370 
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n qr 


1 fi9 
1 .Oat 


4 nonoc 

102935 


X13482 


• 1 AAr^AA 

Hs.80506 


a Art aI 1 p% ■ ■ a! a ai* riliAn i iaIaaafa^ai n a aI t (HA AT 

small nuclear ribonucleoprotein polypept 


1 91 

I.e. I 


4 9 

H.at 


102972 


\ f A AAA A 

X16662 


Hs.87268 


annexin A8 


1 9R 


9 19 
at. Oat 


102983 


X17620 


I t J J AAAA 

Hs.1 18638 


non-metastatic cells 1, protein (NM23A) 


1 ni 

I.UO 


1 fil 
1 .OO 


10J023 


\/TA^A A 

X53793 


1 t 4 4 "7AFTA 

Hs. 11 7950 


multifunctional polypeptide similar to S 


1 RR 
I.OO 


r 44 

O.HH 


103038 


X54941 


Hs.77550 


/A t~\ Av A A _ — -^ 1 — S n )/t n AAA 4 

CDC28 protein kinase 1 


1 V) 


1 7Q 

O. / V 


4 A A A*7IT 

103075 


v /r» A J A 

X59543 


b 1 AAO A 

Hs.2934 


ribonucleotide reductase M1 polypeptide 


1 11 
I. I I 


9 RR 

at.OO 


103168 


X68314 


i 1 ATA A 

Hs.2704 


glutathione peroxidase 2 (gastrointestin 


n 7R 

U./O 


1 flR 


J A A J A- 

103185 


\,#*A A A 4 A 

X69910 


11 TJOAO 

Hs.74368 


transmembrane protein (63kD); endoplasmi 


1 ni 

1 .Ul 


1 Q7 


^ noo4 o 

103212 


\/^A A"T 4 

X73874 


1 1 AO AO 

Hs.2393 


« A. An «%M jl AAA ta*l A A A A* nln tl A H / m I 1 f* A 1 A \ 

phosphorylase kinase, alpha 1 (muscle) 


n qr 


1 79 

1 . / at 


^noooo 
103223 


\ , j Art A 

X74801 


f t — 4 TAfl 

Hs.1708 


A A A A Al*A At A A A lAl 4 A 1 A T A A TY'^D'f' A 1 1 rS 1 1 H 1*f Q / A 

cnaperonin coniaining i ori, suDunuo \g 


n Q7 


1 77 
i.i/ 


103260 


X78416 


If A 41 r - f— 

Hs.3155 


casein, alpha 


1 
i 


1 
i 


103262 


X78565 


1 1 A A 4 A A A 

Hs.204133 


UnvAUTAArtinA / 4 A A A f A i A ' Alf^ aJ'SaIi A l 

hexabrachion (tenascin C, cytotactin) 


1 91 

l.atO 


1 (IQ 


<i nooon 

103330 


X85373 


1 1 4AA 

Hs.77496 


A Art aII «f\ i 1 a(a A r* f*-1 A A 1 1 A 1 A A A fA^ A 1 A A All / A A A^ 

small nuclear ribonucleoprotein polypept 


1 19 
I. Ill 


9 9R 


103364 


\ / A A A —T A 

X90872 


11 nrnr J 

Hs.75854 


oULi lb suiiotransTerase 


* 9 RR 


4 R9 

H.Oat 


<<noo"7c 
103375 


\/A A A AO 

X91868 


Ik r* 4 4 4 A 

Hs.54416 


ninA Am > 1 ! o In A Art A A 1^ AU / 1^ rA T> A A trt ll o\ A Alrtrt aI A 

sine oculis homeobox (Drosophila) homolo 


1 


2 4ft 

at.HU 


103391 


X /A A IfA 

X94453 


II 4^4 AAA 

Hs. 114366 


pyrroline-5-carboxylate synthetase (glut 


■| 
l 


1 R1 

I.OO 


4 no .1 A A 

1 03404 


X95586 


1 1 *7 A f>A A 

Hs.78596 


■^■■#^.4 « a— — M a / nrnn An^ ai mAArA A Ain\ ^ 1 iKl | A it* 

proteasome (prosome, macropain) subunit, 


n Q9 


1 R1 
1 .oo 


J AA i A7 

103437 


x/ A A AAA 

X98260 


1 1 AAAr A 

Hs.82254 


M-pnase pnospnoprotein n 


u.y*< 


1 R4 

1 .OH 


103448 


WAnJ A A 

X99133 


1 \ OA A AOO 

Hs.204238 


IiaakaIi a *J ( Ar^nnAnnn "J A r~*. J \ 

lipocalin 2 (oncogene 24p3) 


U.OD 


n qr 

U.90 


J AA AAP 

103605 


*ror" J oo 

Z35402 


t 1 4 A i AAT 

Hs. 194657 


M«flJl«AvS*« A a AA/lknviA fAMllnAl I aI I 

cadherin 1; E-cadherin (epithelial) 


1 Q9 
I.OZ 


9 R1 

at.O I 


4 noc JtC 

103646 


Z68228 


Hs.2340 


junction plakoglobin 


n rr 

U.00 


1 9R 

1 .atO 


103658 


Z74615 


Hs.172928 


Anil AAAn 1 4 | .HA I I 1 *-l A fl^ 4 

collagen; type I, alpha 1 


1 OR 
I.UO 


9 QR 

at. SO 


>l An»t*i 2 

103774 


AA092898 


Hs.92918 


COX™. lAI/sntslif nimlln^ i~ DQ7PQ Q rP olnnn 

ho I s; weaKiy similar to ku/vjo,o [u.eiega 


1 RR 
I.OO 


4 RR 

H.OO 


J Al AAJ 

104261 


AF008442 


Hs.5409 


kna polymerase I suounit 


U.O/ 


9 17 

at. i f 


104276 


C02193 


Hs.85222 


to I s) weaKiy similar to k*ii uau_ *i [n.sapi 


1.1 


9 4Q 

at.HO 


4 n 4oon 

104289 


C16281 


Hs.75478 


rvlAAUyoD pTOtGin 


1 1R 
I. ID 


1 Rft 
1 .uo 


4 nj >iovi 
104434 


L02870 


Hs.1640 


aaI1«"iaaa*> 4i 1 a a \ /I I » a) nnn 4 /a nt rtl firm oK ja 

conagen, type vn, aipna i ^epiacrmuiys 


1 nA 

I.U*f 


1 49 

1 «H9 


104453 


M19169 


Hs.123114 


cystatin SN 


0.38 


0.76 


104611 


R98280 


Hs. 125845 


ribu!ose-5-phosphate-3-epimerase 


1.08 


2.25 


104758 


M024661 


Hs.7010 


ESTs; Weakly similar to ACYL-COA DEHYDRO 


1.14 


1.65 


105114 


M156532 


Hs.11801 


adenosine A2b receptor pseudogene 


0.91 


1.38 


105132 


M159501 


Hs.247280 


HBV associated factor 


1.08 


1.7 


105174 


M186613 


Hs.34744 


ESTs 


0.95 


2.05 
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105280 


AA232215 


HS.14bUU 


PCTn 

bo IS 


A 
I 


1 A 


i nro A A 

05344 


A A OOCOAn 

AA235303 


Hs.ob4b 


CO IS 




0 AO 

z.uz 


a a a 4 A 

05516 


AA257971 


Hs. 21214 


ESTS 


l.ob 


1 RR 

o.bb 


05621 


AA280865 


Hs.bo7b 


Homo sapiens mRNA; cUNA UKhZpbb4i\u^ii 




1 RO 


05698 


AA287393 


Hs. 15202 


1 1" 1 — _ . \ n. W At* AfH T^l. > a . i-. . 1 ^ _ _ A a V . 4b a. *J j% Ami w^jmi, mm U WWa**l 

EoTs; Weakly similar to oiigodendrocyte- 


u.yo 


1 on 


A a^ A a 

05705 


A A A A A*7 A •'7 

AA290767 


HS. 101 282 


l|.„. __„»,__ m nk|Ai -PIMA ni/[T7r»>fOytDH AO ffr 

Homo sapiens mRNA; cuNA UKrZp4d4biUz (tr 




1 QO 


A j— ^ A l 

05724 


AA292098 


HS.229J4 


r— f>T_. »«!_ _(.|,, | __ i_ -71 Kl /-> CIM/^CD DDAT 

EoTs; Weakly similar to ZINC riNtahK rKU 1 


n qq 
u.yy 


1 A1 


05782 


A A A P" AO *4 F? 

AA350215 


t f » 04] COA 

Hs.21580 


EoTs 


i 


A 

1 


05799 


A A AT A A A O 

AA372018 


Hs.24743 


PPT. 

to IS 


1 nn 


1 7R 
l.f 0 


a r- a a - * 

05807 


A A A A A A A A 

AA393803 


Hs.16869 


ESTs; Moderately similar to uullagen alm 


u.yb 


1.04 


105891 


A A 4 A A"T AO 

AA400768 


1 1. AAAA A 

Hs.26662 


ESTs; Weakly similar to tumor necrosis f 


n Q7 
U.df 


0 OK 


/> ^ A A A 

1 05936 


A A 4 A 4 A A A 

AA404338 




ESTs 


1.14 


1 AR 
1.4b 


06069 


AA417741 


Hs.29899 


to I s; weakly similar to z.inu riNbtK rKU i 


1 


1 


106103 


A A 4 A A A f\ A 

AA421104 


i l _ A Ann A 

Hs. 12094 


rpT. 

ESTs 


1 A/l 


1 AA 
1. 44 


I A A A A C\ 

106140 


A A J A 4 C O, A 

AA424524 


I |_ A A (-1 A o 

Hs. 14912 


KiAAOZbb protein 




0 11 


106149 


A A A n AOOA 

AA424881 


Hs.zobdOl 


CCTi. 

to IS 


A fkl 
U.00 


1 Aft 


l r\ a 4 r* A 

106154 


A A 4 A p- A A A 

AA425304 


Hs.6994 


tb IS 


A 77 


0 AR 
£.U0 


106182 


M426609 


Hs.108b2 


to IS 


A 7A 


0 03 


106220 


AA428582 


HS.o2iyb 


to i s, Moderately similar to metargidin p 


A Q7 


1 QQ 
i .yy 


106228 


AA429290 


HS. 17719 


to IS 


A QQ 

u.yy 


1 RA 
1. 04 


106318 


AA43bb7Q 


u„ ncnc 

Hs.ybuo 


pre-mKNA cleavage ractor im (^bKuj 


A QR 

u.yo 


0 AQ 


106341 


A A A A A "jno 

M441798 


HS.5243 


CCTi«. 1 1. J., r _l.|.. _!_,;i_ r i_ _H O Umnlhn 

to 1 s; Moderately similar to pit_z nypotne 


A Oft 

u.yo 


0 RR 
Z.uO 


I ftp j aa 

1 06432 


AA448850 


Hs.1 nd8 


to is 


fi Q^ 
u.yo 


1 Q3 
i.yo 


I A/"* A~7 A 

1 06474 


A A A rftA4 A 

AA450212 


HS.42484 


Homo sapiens mKNA, cuna ui\rz.pbb / fL-ubJ tir 




1 


[ aa ino 

[06483 


A A A CA C7C 

AA451676 


Hs.oU2yy 


ibr-ii mKNA-uinding protein c 




9 9Q 


l a a /* a f\ 

106599 


aaa niic 

AA457235 


Hs.1 2842 


to I s; Moderately similar to non-iunction 


1 


1 ft9 
I .oz 


1 /\/>/>4 4 

106611 


A A ACOF\l\A 

AA458904 


|_|_ OCOC7 

Hs.2b2b/ 


to I s, weakly similar to torsinA [n.sapie 


1 AQ 


9 7ft 

£.10 


106654 


a a Ar*f\A An 

M460449 


HS.3784 


P A 1 Al 1 ]tm Mill ■ rvk W t j*h ^ m j«* « A A •>•■ nnA 

to I s, Higniy similar to pnospnosenne am 


i 


1 A 


107076 


A A A A A 4 4 f 

AA609145 


Hs.21143 


ESTs; Weakly similar to fos395b4_l [n.sa 


1. 1 I 


1 AQ 

i.4y 


107115 


A a cl AH AO 

AA610108 


ii„ OVCQO 

HS.2/b9o 


rPTp. LlinhKr cimilnr in APM 1 0/! nrnfotn 

to I s, nigniy similar to ubi-i<i4 protein 


1 
I 


I .UJ 


107129 


AAbZUbbo 


HS.4f0b 


471 nn A 4l*f IaIi II^A AAAAlftA AllAAntlA AAPA I 

Tiap structure-speciiic enoonuciease i 


1 1^ 
I • 10 


O.DO 


4 r>>—7 A r* a 

107159 


A APHONIA 

AA621340 


1 i_ 4f\cr\r\ 

Hs. 10600 


tSTs; weakly similar to UKr ykkuoic [o.c 


1 AR 
I.UO 


0 AQ 

z,uy 


4 A - j AAA 

107444 


l A IA A A A 4 

W28391 


Hs.5181 


proliferauon-associated 2b4; o8kU 


l.lo 


1 Q 

i.y 


1 f\~r An A 

107481 


lAlCQ^I A"^ 

W58247 


Hs.27437 


Homo sapiens kinesin superfamily motor K 


A QQ 

u.yy 


0 7A 


4 r\"7 a A a 

107516 


X56597 


Hs.99853 


tiDnliann 


A QA 

u.y»t 


1 77 
l.f* 


107529 


Y12065 


11. CAAA 

Hs.5092 


nucleolar protein (KKt/u repeat) 


I.UO 


0 10, 

z.zy 


107531 


\/ 4 AAA A 

Y13936 


i i_ A-rnnn 

Hs.17883 


protein pnospnatase lb (formerly 20), ma 


1 AR 
I.UO 


1 RO 
l.OZ 


107801 


AA019433 


|j„ i1*704AA 

Hs. 1731 00 


ESTS 


I.UO 


1 A 
1. 4 


107957 


A A /\o 4n^f) 

AA031948 


II _ C"7CjIO 

Hs.57548 


COT., 
to IS 


A 

u.yo 


1 AR 


i a a a 

108565 


a A nnri i a 

AA085342 


Hs.1 526 


ATPase; Ca++ transporting; cardiac muse) 


n cq 
u.oy 


1 3R 
i.00 


108780 


A A A AnpAJ 

AA1 28561 


1 K 4 4 7AAQ 

Hs.1 17938 


collagen; type avI>; alpha 1 


A 

l 


7 R*? 

/.bo 


4 Ann 

108828 


A A 4 A 4 r~A 4 

AA131584 


Hs.71435 


DKFZP564O04b3 protein 


1 .00 


0 RR 
Z.Ob 


4 n a a a a 

109060 


A A 4 AAfllA 

AA1 60879 


Hs.241551 


chloride channel; calcium activated; tarn 


n C7 


1 AO 
I.4Z 


4 a a ^ <4 a 

109112 


4 4 J /> A A ^A 

AA1 69379 


Hs. 72865 


EoTs 


AQ 


Z.O l 


r a a A 4 J 

! 09344 


A A A 4 AAAA 

AA213696 


1 1 AAAA A 

Hs.86559 


po!y{A)-binding protein-like 1 


n 07 
U.yY 


1 RR 
1.00 


t An J j n 

109412 


A A AA^4 A f" 

AA227145 


1 1 • AAA 4 *7 A 

Hs.209473 


fOT... \A/ A ^.I.).. nla.ll.. i— ryr~f*i || ATHD P\IT KIT 

ESTs; Weakly similar to REbULAl UR Ur Ml I 


n 7R 
u. /b 


1 87 
I. Of 


110780 


■ inn 4 T 4 

N23174 


t i— a a a n 4 

Hs.22891 


solute carrier family 7 (cationic amino 


n q 

u.y 


n QR 

u.yo 


110958 


N50550 


Hs. 24587 


HIM w «.| l.j> n _ t*i t |rS 4l j^ hwmImi A / 1 1 O A A A 4 AI A 

signal transduction protein (ono contain 


1 17 
I. if 


9 9fi 
z.zo 


111018 


Mr* 4 A A "7 

N54067 


Hs.3628 


mitogen-activated protein kinase kinase 


I.Zl 


1 fiR 
I.OO 


1 j j a a^ 

111337 


N79612 


Hs.16607 


to I s; Higniy similar to Myosin heavy cna 


1 


1 AR 


4 u aa a/" 

112305 


n 4 A A A 

R54822 


Hs.26244 


ESTs 


A 

1 


A 
i 


112401 


no 4 a a 

R61279 


Hs.237536 


rPT* . 1 A /_ — 1,1. , _!_.:■__ 1_ C1CDC O TA Alana 

ESTs; weakly similar to f-Zoao.o [O.eiega 


1 OA 


1 RA 
1. 04 


112853 


T A A A 4 A 

T02843 


Hs.4351 


COT 

EST 


1 RR 
1.00 


1 QR 

i.yo 


112869 


VAA A 4 A 

T03313 


II. J "7 yl "7 

Hs.4747 


jjJ . 3 mm 1 At Awm v j^ 4 j% 0* ■ jf^ jAh jAh r%k ju j« n T I «■ 4 ■ jj . ja I jaaHM 

dyskeratosis congenita 1; dyskenn 


1 A^ 
I.UO 


1 R7 
I. Or 


A 4 aa AA 

112992 


TAOr j4 a 

T23513 


Hs.7147 


to IS 


I 


1 


1 1 3048 


T25895 


HS.184UU8 


to I s; weakly similar to KNA-Dinding prot 


1 ^7 
I. Of 


9 9R 
z.zu 


A A on^<i 

113063 


T32438 


Hs.bUz/ 


rpT. 

to IS 


1 


1 


113179 


T55182 


11. HCACT'I 

HS.1 520/1 


to I s, nigniy similar to ibr-n mKNA-Dina 


I.OO 


9 7 
z. / 


113573 


TA4 4 A A 

T91 1 66 


I I. a cnnA 

Hs. 15990 


to IS 


A 7R 
U. i 0 


1 A7 
1 .4/ 


113811 


111 1 i AAA 

W44928 


Hs.4878 


rpT. 

ESTS 


A 7Q 

u. /y 


1 R1 
1 .0 1 


114086 


Z38266 


[l_ Af\Tjr\ 

HS.1 2770 


LJaa^a aaaiaaa DA aIaaa T~\ 1 Pi 7 7 *7 0 Q fmm 7n 

Homo sapiens rAU clone uju^ / /uzo trom /p 


A Q 

u.y 


1 3A 
1.04 


4 4 4 r*n*9 

114587 


A A A"7 A n A"* 

M070827 


II. A OAAAA 

Hs. 180320 


cota. » « *_ _ -4— f+rti r»i >i tdakiokjickji 

ESTs; Weakly similar to GQLbl 4-1 RANoMtM 


1 AO 


1 7R 
1. 1 b 


4 4 4 A 4 A 

114846 


A A AO JAAA 

AA234929 


Hs.44343 


rpj. 

ESTs 


■1 QO 
1.J4 


9 3R 
Z.Ob 


4 A 4 n A 4 

114964 


AA243873 


1 f- AA4 A 4 

Hs. 82184 


ring finger protein 3 


n 1 

1.1 


1 P/l 
1.04 


4? A r^A 4 T 

115047 


A A A AA*7 

AA252627 


Hs. 22554 


homeo box B5 


1 ni 


9 3R 
Z.OO 


4) 4 1-4 A A 

115166 


A A APA A f\f\ 

AA258409 


Hs. 198907 


myelin protein zero-like 1 


1 AR 
I.UO 


0 31 
Z.O I 


A A r*A *t 

115167 


A A APA A A4 

AA258421 


Hs.43728 


hypothetical protein 


1 KO 
1.0*1 


0 RO 
Z.oZ 


4 4 POO o 

1 1 5239 


A A O^OArA 

AA278650 


HS.73291 


r~ r** i j»« • \ Pits*. 4^t>«t ■ t aiw%!Iai> 4a AimllAi* 4a 4aa W 

to I s; weakly similar to similar to me o 


A 7 
U. / 


0 R7 
Z.O/ 


4 4 f*n*?rt 

115278 


AA279757 


I l_ 0"7>tOff 

Hs.67466 


Eo Ts; Weakly similar to bAbNoZbn.d [U.m 


1 IA 
1. l*t 


0 10 
Z. IZ 


115652 


A A JACAAO 

AA405098 


1_]_ 00170 

Hs. 38178 


COT/, 
to IS 


n no 

U.OA 


A R7 
4.0/ 


4 4 j» A""» r* 

115875 


a a JAAAilA 

AA433943 


Hs.43946 


r^OTj*! \ A _ t . t » » AikaiIjik 1a I A f Am. n,\ At A— | ml T 1 A wpt 1% f 

to 1 s; Weakly similar to weak similarity 


1 0 
1.Z 


1 on 
i.yo 


4 4 AAA 4 

116004 


A A j J A4 A A 

AA449122 


Hs.7608b 


to I s; Highly similar to small zinc tinge 


n qr 
u.yo 


1 31 
1 .0 I 


4 4 A 4 n 4 

116121 


AAA r- A A P" 4 

AA459254 


Hs.48855 


ESTs 


n Q7 

u.y/ 


1 RR 
1.00 


4 4 A 4 A A 

116129 


a a 4 pr\n c/** 

AA459956 


Hs.49163 


f"OT»ll 1 JinUti 1 j— \ il-j! i_ pMtlrtlilfA riAAAIlA 

tb I s; Highly similar to putative noonuc 


•\ Afl 
I.UO 


0 73 
Z. /O 


A 4 A 4 A A 

116190 


A A 4 A J AAA 

AA464963 


Hs.67776 


rpT. 

ESTs 


fi R 

u.o 


1 R7 
1 .0/ 


4 4 A A ^ A 

116312 


a A i n a i *~\ 4 

AA490494 


1 1— iAA 

Hs.65403 


ESTs 


t Q7 
1.0/ 


0 RR 
Z.OO 


116732 


f~,4 A j 1 A 

F13779 


i i 4 or*rsnn 

Hs.1 65909 


TAT* 

ESTs 


n oo 


1 R 
1.0 


4 .4 ^ A A A 

117602 


N35020 


I I _ j innr 

Hs.44685 


rpj. , 1,1., _S__!|__ i_ r>/~\\ IATU DDATCfM 

ES r s; Weakly similar to bULiAi h rKU i cin 


1 1R 
1.10 


1 ftA 
1.04 


4 4 ^ a r - A 

117950 


1 IPJ A A A 

N51394 


1 ""7 f? 4 TF A, 

Hs.75478 


KIAA09bb protein 


l.UH 


0 3R 
Z.00 


117992 


N52000 


Hs.1 72089 


Homo sapiens mRNA; cDNA DKFZp586B0222 (f 


0.62 


1.29 


118785 


N75386 


Hs.111867 


GLl-Kruppel family member GLI2 


1 


1 


119717 


W69134 


Hs.57987 


ESTs 


1 


1.4 


119814 


W74069 


Hs.58350 


ESTs 


0.78 


1.77 


120128 


Z38499 


Hs.91448 


MKP-1 like protein tyrosine phosphatase 


0.86 


1.46 


120242 


Z98443 


Hs.86366 


ESTs 


0.83 


2.01 
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1z04b\3 


A A oconn^ 

AA252994 


Up -IC7Q 


apoptosis inniDUor 4 \survivm) 


n 7 a 


1 R4 


121054 


AAo9ob04 


Up 070Q7 


to IS 


1 A5 


1 Q3 
l.i/O 


A f\A oO£ 

121326 


A A Af\A*iAC 

AA404246 


Ur. 07AOH 


COTki lAfppbt.t •ImiUr »/n CimiUp tp n U..U 

bo 1 s; weaKiy similar to oimiiar to pnyto 


u.yo 


I.O 


H OH n^o 
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Table 1B shows the accession numbers for those pkeys in Table 1A lacking UniGene IDs. For each probeset, we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland, California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
Accession column. 



Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey 



CAT 



Accessions 



100661 
100667 



23182J 
26401 3 



100668 26401 3 



101332 25130.1 



BE623001 L05096 AA383604 AW96641 6 N53295 AA46021 3 AW571519 AA603655 

L05424 X56794 S66400 X55150 W60071 AW351820 X55938 M83326 BE005289 BE070059 M83324 BE005248 BE069717 BE181648 BE069700 
AW606203 BE069721 AW382138 AW803776 BE463954 BE005334 BE005274 T27386 AA932714 AA972695 AW377728 A1632506 T29066 
AI783934 AW377727 BE163715 AL047291 AA279047 AA523003 BE008048 BE440141 W23614 BE090519 BE092193 N29181 N20358 N44153 
BE546944 T69231 AW377441 AA907406 H50799 AW051416 A1420712 BE620922 A1279161 AA992549 W47198 BE005241 AI342696 H50700 
AI969974 AI863855 AA374490 AW1 30675 Al 950633 AA146687 H99482 X55150 BE005414 BE005339 N28294 AI673068 AI887890 AW804171 
A1675961 AW804172 AA778841 AL048050 A11 27757 AI095568 AW204965 AW468978 W31898 AI052595 AI278771 BE464018 AI081503 A1824196 
AA513211 AA411062AW084376 N48752 AA703209 N35580 AW059918M054563 Al 280942 T276 19 BE621435 N66010 AW589527 A1160414 
AA283090 M962536 H82726 W521 15 W45432 W60433 AA577548 AA146714 BE150994 M054615 AW796025 AW382768 BE565671 C00444 
AA054555 

L05424 X56794 S66400 X55150 W60071 AW351820 X55938 M83326 BE005289 BE070059 M83324 BE005248 BE069717 BE181648 BE069700 
AW606203 BE069721 AW382138 AW803776 BE463954 BE005334 BE005274 T27386 M932714 AA972695 AW377728 AI632506 T29066 
A1783934 AW377727 BE163715 AL047291 AA279047 M523003 BE008048 BE440141 W23614 BE090519 BE092193 N29181 N20358 N44153 
BE546944 T69231 AW377441 AA907406 H50799 AW051416 AI420712 BE620922 A1279161 AA992549 W47198 BE005241 AI342696 H50700 
AI969974 AI863855 AA374490 AW130675 A1950633 AA146687 H99482 X55150 BE005414 BE005339 N28294 A1673068 AI887890 AW804171 
AI675961 AW804172 AA778841 AL048050 Al 127757 AI095568 AW204965 AW468978 W31898 AI052595 AI278771 BE46401 8 AI08 1503 AI8241 96 
M51321 1 AA411062 AW084376 N48752 AA703209 N35580 AW059918 AA054563 AI280942 T27619 BE621435 N66010 AW589527 AI160414 
AA283090 AA962536 H82726 W521 15 W45432 W60433 AA577548 AA146714 BE150994 AA054615 AW796025 AW382768 BE565671 C00444 
AA054555 

J04088 NM_001067 AF071747 AJ011741 N85424 AL042407 M218572 BE296748 BE083981 AL040877 AW499918 AW675045 H17813 
BE081283 M670403 AW504327 BE094229 AA1 04024 AI471482 AI970337 AA73761 6 AI827444 AW003286 A1742333 A1344044 AI765634 



91 



WO 02/086443 



PCT/US02/12476 



100780 458J27 
100830 4002J 



100906 4312.1 



100930 16865J 



102221 3861J 



101809 32963J 



102590 15932J 



101977 29073.1 



102781 2081 2_1 



AI948838 AW235336 AW172827 AA095289 BE046383 AI734240 W1 6699 A1660329 AI289433 AA933778 AW469242 M468838 AA806983 
AA625873 W78031 BE206307 AA550803 AI743147 AI990075 AA948274 M1 29533 AI635399 M605313 AI624669 AW59431 9 A1221834 AI337434 
AA307706 BE550282 AI760467 A1630636 A1221 521 AW67431 4 AW078889 AI933732 AI686969 Al 1 86928 AW074595 Al 1 27486 AL079644 
AI910815 H17814 AA310903 AW137854 T19279 AA026682 AA306035 AW383390 AW383389 AW383422 AW383427 AW383395 H09977 
AA306247 AA352501 AW403639 F05421 M224473 AA305321 H93904M089612 AW391543 AW402915 AW1 73382 AW402701 AW403113 
R94438 N731 26 H93466 AA090928 M095051 T29025 AW951 071 L47277 L47276 AI37591 3 BE3841 56 W24652 M746288 AA568223 BE090591 
H93033 N57027 AA504348 AA327653 AW959913 N53767 AA843715 AI453437 AW263710 AI076594 AA583483 AW873194 AW575166 AI128799 
AI803319 AL042776 AW074313 AI887722 AI032284 AA447521 AH 23885 N29334 AI35491 1 AW090687 AA236763 AA435535 AA236910 
AA047124 AA236734 AW514610 H93467 AA962007 AI446783 AA127259 AI613495 A1686720 AI587374 AA936731 AA702453 AI859757 
AA216786 AI251819 AI469227 AA806022 AI092324 N71868 M968782 M236919 AA809450 M227220 AA765284 AI192007 AA768810 
AA805794 AA729280 M806238 AW768817 N71879 A1050686 AA505822 AA668974 AI688160 BE045915 AW466315 AA731314 AA649568 
AA834316 AW591901 AW063876 AW294770 AI300266 A1336094 AI560380 AA721755 H09978 D20305 D291 55 AW821790 BE150864 F01 675 
AI457474 AW466316 M550969 AA630788 

BE561958 BE561728 BE397612 BE514391 BE269037 BE514207 BE562381 BE514256 BE514403 BE514250 BE397832 BE269598 BE559865 
BE396881 BE560031 BE514199 BE560037 BE560454 

AC004770 W05005 AA356068 M094281 H29358 T56781 AW875313 L37374 BE312466 BE311755 BE207106 BE293320 BE018115 AW239090 
BE548830 AW247547 AA776062 BE397382 AA48671 3 T101 1 1 T09340 AW498981 BE547280 AA356003 AW581 520 AW875331 AA580720 
AW875336 BE276873 BE408229 AW188148 BE255166 BE253761 AW793727 AW373141 AW581548 M471223 AA30595O BE263976 AA626820 
BE257409 AW360962 AA090655 C0031 2 BE31 2741 BE40721 3 AA209352 AW2981 99 AW248553 AW297794 AW731 722 BE300586 AW731 972 
AW615446 BE301599 AW615520 AA486714 AW440257 M196516 M564630 AA618079 AW192592 AW474985 AA604580 AI627461 AA765440 
AI680394 AL1 35548 AI683224 AI581 126 AW245096 AW194154 H29274 N70363 AA629758 AA580602 AA862006 AI863841 AI097667 AI928583 
AI358774 BE243487 AA620553 AA653297 AA292690 T101 10 Z38906 AA908544 AA340930 A11 85438 T03328 T28844 AI68701 0 AI864965 
AI872575 BE388740 T56780 AW373138 BE258717 AA699671 

AU076916 BE2981 10 AW239395 AW672700 NM.003875 U10860 AW651755 BE297958 C03806 AI795876 AA644165 T36030 AW392852 
AA446421 AW881866 AI469428 BE548103 T96204 R94457 N78225 AI564549 AW004984 AW780423 AW675448 AW087890 AA971454 AA305698 
AA879433 AA535069 AI394371 M928053 AI378367 N59764 A1364000 AI431 285 T81 090 AW674657 AW674987 AA897396 AW67341 2 BE063175 
AW674408 AI202011 R00723 AI753769 A1460161 AW079585 AW275744 Al 873729 D25791 BE537646T81139 R00722 
J04129 NM 002571 AA293088M477016 AA404631 T28299 AA476904 AA433965 AA430486 AA495907 AI151391 AA291495 AA402723 W25651 
AA70681 6 AI82671 2 AW296294 AA293479 AI276581 AW0441 54 AI0801 80 AI41 7985 A12741 68 AI47421 2 AA495908 M635664 AI0921 1 4 
A1804952 AA479874 AI597661 AI42051 1 AA479738 AA421417 AA421 247 AA436220 AL047797 M34046 N42277 AA228076 W02698 A1420297 
AA434011 AI369971 M479731 A1865541 AI41 8020 AA42 1246 AA452764 AL048051 

NM.006769 U24576 AW161961 AW160473 AW160465 AW160472 AW161069 AI824831 AW162635 AI990356 AW162477 AW162571 AI520836 
AW162352 AW162351 AW162752 AI962216 AI537346 AA853902 H17667 BE045346 BE559802 BE255391 AA985217M235051 AI129757 
AW366451 T34489 D56106 D56351 AI936579 AW023219 AW889335 AW889120 AW889232 AW889175 BE093702 AW889349 AA147546 
AI952998 AA91 2579 AI143356 AW90221 1 R64717 AW157236 AI81 5242 D45274 AW263991 AA442920 M1 29965 AL035713 AI923255 A1949082 
AI142826 AI684160 AI701987 AI678954 AI827349 BE463635 AW628092 AW302281 AA493203 BE348856 BE536419 AW193969 AW673561 
AW592609 AI224044 H43943 M091912 R49632 R48353 AI568409 R48256 AI198046 H27986 H43899 AI678759 AI680310 AI624220 H17052 
AA156410 N56062 AI699430 M664529 T09406 T10459 AA627506 AI379584 N83831 N88633 AW022651 AA971281 M248036 AI039197 
AI91 4689 AA973825 AL047305 AA129966 AI798369 AW264348 AI445879 AI658759 N67924 AI933507 AI216121 AI333174 T10972 AI375028 
AH 86756 AI273778 AA610487 AI797946 AA853903 AA903939 AI338587 AI278494 AW627595 AA904019 

M86849 AA315280 NMJ04004 AA315269 BE142653 AA461400 AW802042 BE152893 AW3831 55 AA490688 AW1 17930 AW384563 AW384544 
AW384566 AW378307 AW378323 AW839085 AA2571 02 AW378317 AW276060 AW271245 AW378298 AW384497 AI5981 1 4 AW264544 AI01 81 36 
AW021810 M961504 AW086214 AW771489 AW1 92483 AI290266 AW1 92488 AW384490 AW007451 AW890895 AA554460 AA613715 
AW020066 AI783695 AI589498 AI917637 AW264471 AW384491 A1816732 AW368530 AW368521 AW368463 AA461087 AI341438 AI970613 
AI040737 AI418400AA947181 AA9627 1 6 Al 280695 AW769275 AW02359 1 Al 160977 AA055400 N71 882 AA490466 AW243772 AW3 16636 
AI076554 AW51 1702 N69323 H88912 AA257017 AI952506 H88913 AI912481 M600714 BE465701 N64149 C00523 N64240 AA677120 
R61573 BE005029 X98091 AA297307 BE537267 BE566138 BE566139 F11561 BE564795 BE568776 AW064005 BE566479 BE380035 BE567012 
BE568634 BE566568 AA298060 BE566043 BE568813 BE568618 AA283070 BE565414 BE566738 BE568585 BE565667 BE566116 BE566433 
U62136 AF049140 BE567057 BE567297 BE567403 BE564316 BE567400 BE568854 BE566588 AA448772 M071363 AW732642 BE564996 
AA297763 AA278550 AA421 083 AA2981 84 AA091 007 AA984577 AA20591 6 N28759 AL031 291 C1 5757 C1 5761 H02728 BE566410 AA1 29335 
AA41 9499 N87741 BE379689 BE004824 BE37961 1 D25874 AA148454 AA323654 AW95031 1 AA448795 AW749423 AA773386 M773843 
AW020327 BE348580 BE504258 BE549990 BE220200 AI673334 AI202679 AA975515 D61421 AI168688 AA102843 AW246621 AI276203 
AI074054 AI633824 AI962927 AH 48926 N50969 AI30891 1 AA41 0994 AW373025 AA148455 H02620 AA688293 AI24631 8 N22220 AI91 7777 
AI050943 AI097286 AA663794 AW368662 AW627826 AW078734 AI253060 AA7491 54 AA832236 AI192358 AW024676 AA448676 AA764891 
BE439467 M661 534 AA258061 AI090546 AA995157 AI051 01 1 AA584421 AI026032 AW591 338 AW589563 AA776914 AW024684 AA421 002 
F09219 BE464500 A1383595 AA954244 AA601583 AA737304 M1 95549 AA805778 AI055876 AA1 64942 AW01 3961 A1672608 AW51 421 1 D59441 
AW582574 AA160935 BE566501 BE564612 BE565353 BE568195 BE565447 BE568302 BE566097 BE565470 BE564249 AL036217 AW749424 
BE567494M1 02842 AA31 4761 AV661237 C14211 AA651866 AW798997 AA470605 

AF112213 AL050318 T24804AW248136 BE386341 BE263177 W16677 BE250224 BE563669 BE267405 BE546577AV651354 AV651292 
AI346903 AI5391 28 Al 1 891 71 S83364 AW073849 AI81 6760 AW073309 AI422690 AA296692 AI860301 AI805446 N77735 AI340328 BE092530 
AW028742 BE088442 AA657742 AA742438 AW1 70086 AI038920 AI432379 N36073 AI9361 94 AA868655 AA98361 2 AI077505 BE080433 
AI37501 4 Al 1 26547 AI348244 AI346077 AI748952 N26915 AI753574 AI093341 AI278762 BE092517 N74204 H06158 T58149 AI129303 mB386 
AA524456 BE122661 AA542925 AI2461 20 A1735203 AA706829 AA877544 AI082289 M926687 N92840 AW249798 M934763 AW998363 
AI1 28632 N25202 AI240209 AW1 1 8892 N80744 R35655 AI342321 AI340141 AW878792 AI857321 H0961 0 W04601 AW006650 AA1 26006 
AA553675 AI052791 AW059835 AI041906 AA814658 AW002059 AA729483 AI609301 AA994633 AA903651 AI459183 T95072 AW088630 
AA1261 12 AI800091 AI561215 H17502 AW475072 AI819003 AI683272 AI262701 AW793140 T81787 R99586 AI275160 AI310420 AI698929 
M1591 74 AI827968 F30305 F30309 AA806662 A1091923 AW78722 AA583430 AW571 913 AI674584 AA292533 AI079471 AA642325 AA71 9050 
AW793172 AA305476 AW1 03745 T23459 N79525 AI784438 AA534551 AW193751 AI074360 BE281214 T32229 W25066 W01205 T63086 
AW795348 AI361287 AW795353 AW795349AA594759AI 400295 D11489 A1370689 AA482356 M485295 W40151 AA564661 AW300745 
AI346938 AI374975 AI423782 AW1 93899 AA612604 Al 1 83409 AA996156 AW366963 AW366977 AI284860 AA846503 AI985064 AA844576 
AA737921 AA873274 BE241546 BE241540 M484058 AW468970 AA1 27876 M159120 AW001568 AW795213 AW795258 AW795330 BE250589 
BE387572 AA910895 AA1 61 217 BE250380 W31 500 T951 67 AI719306 AI359224 

BE258778 BE281 230 BE41 0044 T33723 AW672694 AW410439 NM.006429 AF026292 T35505 BE542333 T08940 AU076737 AW247471 
BE393215 AW328640 BE542408 T32170 BE302544 T31955 BE206898 BE275738 T32570 BE386426 BE298746 BE389937 BE293991 BE315289 
BE389578 R34739 R15312 BE279365 BE277756 AL03601 9 T33725 BE277779 BE302962 AL047294 BE276505 T09070 T33673 BE312580 
AW387774BE257175 AW674367 BE253331 BE270344 BE299831 BE273576 T32062 AI751831 BE618381 AA304899 BE252268 U46364 
BE256790 BE207199 BE256209 BE251941 BE250791 BE313955 BE269806 BE543623 BE279212 BE252289 T31699 BE262220 T31669 
AA315781 AA192212 N84547 BE292737 BE259631 AA232179 A1133144 T31292 AA315945 BE407301 BE251184 BE409006 AI880158 AI904003 
AI904114 AW651768 AW651763 R58247 BE271897 U83843 C05298 BE261609 BE255973 AA351650 N84631 BE263637 AW452910 AA328465 
AA324549 AW579525 BE252296 BE257551 AL048332BE208630AA359336 AW327897AA151742 M305816 BE076862 BE076796 BE263161 
AA323785 AA676588 AA626565 AA078917 W87657 R09002 R94021 AA312032 BE276665 M295608 AW407162 M329374 AW877912 N27885 
M369256 AA360968 BE250476 N85427 BE265569 AI278639 AI816576 AI691037 AW328583 A1567949 AI983455 AI927732 AI81 1297 A1571508 
AW073674 BE296039 BE467326 A1828796 AI81 6578 AW51 1604 AI921213 AW1 52427 AI795787 AI801 61 8 AW168866 AI628144 AI890339 
AW173690 AW51 1540 BE535620 AA383014 BE301 164 AI866596 AW514909 AA658050 AW575243 AA074631 AI093488 AW575408 AW675443 
AW615636 AW732207 AW377638 M321 784 AA641 629 M633105 AA527640 AW129146 AW61 5672 BE394607 AA483902 AW475032 BE378532 



92 



119221 102947 J 



125831 

mm 

113195 



119861 
112973 



1522905J 

45743_3 

178688J 



238266 1 
4868J 



129402 
105936 



47367J 
260931J 



129466 2094_50 



WO 02/086443 PCT/US02/12476 

AA872808 AI469388 AW105268 BE047301 AW591843 AW41O066 AW517153 A1950495 AA746641 AI914878 AA873185 AI696911 AA548625 
AA91 1505 AA1 48762 AW674535 AI587329 BE328328 AW270348 AA158225 AW1 1 7705 AW474997 AW51 91 93 M614757 AW664383 AI082647 
AW590973 A147671 1 AA192213 N88741 BE464552 AW072679 AI453708 AA152166 AA805924 AI581078 AI125768 AW1 73484 AI961 980 
BE300766 AH 99698 A1636792 AW247333 AW272861 AA078818 AA15001 2 AA551 232 AA678821 AW873869 AW768266 AI66031 5 M319210 
AA814551 AA1 57994 M318886 AI582962 AW089224 AI356098 AI343694 AW072598 N21054 AI301249 AA742924 H17917 AW328584 . 
AW248898 AI751830 M907816 R08898 AW087989 AI828300 AA148596 AI269577 T33426 AA213571 A1973201 AA666279 R49612 AI573183 
AW799762 AW410068 AW769666 AI962097 AI475204 D57490 AW517531 BE245270 AW470008 T33427 AW005731 AI795795 T23753 AW272981 
T15747 AA552875 T23644 AW361289 AI758558 BE207435 AA876958 T03361 AA883569 F37533 AA582321 AW082524 R4221 2 AA973847 
T18900 M086202AI559867A1302418 M948667 AA745670 T08939T33724 T33722 BE621568 D57489 D25906 BE621151 F16510 C05966 
T35127 AA630427 A1933481 AA309426 AI918440 BE561854 BE618866 BE394675 BE296173 AW951687 BE383739 BE616141 BE312730 
BE535351 AW080575 BE313330 BE616664 AI354390 AA847315 BE544509 BE515212 BE297833 BE278808 BE544844 AW0901 78 Al 890664 
BE546708 AW189943 BE274412 BE382399 BE266392 BE254949 BE280696 BE383237 BE261756 BE257721 BE312683 BE275476 BE514880 
BE545314 BE313587 BE384537 BE386691 BE264813 AW592575 AI336332 A!£78641 AI795791 BE222662 AW2493 16 AA3 14361 AL036012 
AW402923 BE266845 AA075945 AA314436 BE384640 AW731769 AW957077 AA552234 AA573560 AW367038 AA313399 AI983873 BE410159 
BE263803 BE514339 BE409073 BE281296 BE543396 BE395387 BE088360 BE546946 BE546570 BE390626 AA074638 AA301821 AW845230 
AW582379 AI949222 AW029572 M515843 AW272394 BE250234 

C14322 W74050 AI074232 AA595624 BE048955 AH 4841 7 AI583145 AI473460 AI801688 AW573593 AI950741 AI628140 AW467921 R98105 
AJ149258 AI247584 AI078378 AI139850 AA48941 1 W24744 R98104 AI033826 AA699589 AI033120 N55544 W88984 AW970771 M703362 
M0991 38 AA706792 AA0461 50 H98981 AI91 6674 M95301 8 A1972749 AI921 343 M909044 AA094751 AI2031 24 AA582143 AI446654 
AW235415 R70377 M099236 F20703 AA524436 R69484 
H04043 D60988 D60337 
AI204246 AI204250 Al 194050 

H83265 T63524 AA304359 AW960551 A1672874 A1749427 AA227777 AW027055 M971834 T49644 T541 22 AI983239 AI808233 T91264 T96544 
AI350945 AI7091 14 R72382 T48788 R48726 AW38541 8 AI095484 T49645 AA928653 AA570082 AW007545 T57178 AA51 641 3 M91 31 18 T571 1 2 
AA564433 AA774503 AA367671 T59757 

W788 1 6 AI720806 AI633854 AI632086 AI668663 N70894 AW571 809 AI383592 AI201 348 W8071 5 N91 880 AW9631 01 AA33901 1 
AB033023 BE391906 BE275965 BE277872 BE003882 AA313774 BE019159 BE298024 BE299727 BE300011 BE390277 BE394764 N87550 
BE409419 BE408652BE408197AL119332AA622427AI816265AA610118T07318AA019839 AA634430 BE205794 BE049461 AI042322 
AI65271 1 AI917645 AA630045 AW191969 AI817882 T1 7271 AI803663 AI095533 H4601 9 AW592438 AJ624836 AI675552 D51 1 49 AW132058 
AA639614 AI925762 AW088153 T17455 AA018640 AW751475 BE300241 AI816255 BE391981 AW408671 AA353910 AW875446 AW875703 
AW875926 AW875645 AW875647 AW938037 AL1 38042 AW89261 9 BE24301 8 AW995454 BE246381 BE009082 BE278921 AW967842 AA262454 
H30121 

W72062 AF088057 W76255 AI82721 9 AI631461 AW449295 AI354957 AI91 3803 T62772 AI222040 T62921 T63781 
A1678765 H12175 R14664 AI914049 AA995383 H08009 H19418 AW953728 AI358021 AA587361 AI269377 M369905 AW957113 H27693 
AI300474 H73776 W74397 AA579604 AI131018 W72331 AI719085 AA568348 AI859045 AI814819 AI888714 BE467470 AW131268 H19419 
H27694AI342165A1914155AA534872 BE018176 R60206 H11647 R45641 AI860466 B E30 1656 AH 25453 AI498 120 M593735 AA8791 10 
A101 6404 T3501 8 AA588397 AW449767 AA470365 BE501 1 39 AA588354 AI337500 AW078532 Z41 279 AH 25449 AA935725 M404338 
L42583 NM.005554 L42601 BE1 83076 A1541221 BE1 40567 L4261 0 V0151 6 J00269 AW275792 AW383052 AW380143 AI541 1 02 BE612846 
AI541 344 AW238368 BE61 3405 BE61 5705 BE61 5530 BE61 5301 AW379823 AW794706 AA1 94806 AA1 94992 AW384024 AW384000 AA641 239 
AI246504 AI540333 AW238681 AA640939 AI540863 AI608860 AW862564 AW366725 AW368983 AW366870 AA596020 AW794721 AW79451 1 
A1591 1 81 BE1 82523 AW794644 AW794620 AI935234 AI608903 AI608623 AW797060 AW084935 BE182517 BE1 82319 AI890082 AW238346 
AW797012 BE182522 AW794838 AI608794 AW304289 AA1471 93 M595995 AW381 128 AW366720 AA583718 A1828416 BE122864 AW368343 
AA431080 AW082039 AW380976 AA587144 AA443636 AW872937 AW794448 AW378382 AW085761 AW794718 AW263895 M583587 
AA583991 M583994 AA586886 AA586880 AW368365 AI81 4460 AA586991 AI282829 AW378406 AA586721 AI609242 AA431 973 M232959 
AI831095 AW263854 AW378391 AW378415 AW378381 M036990 AW238395 A1285446 BE208219 BE049526 AA583605 AA583918 AW366711 
AI285580 AW082642 AI285712 AA582875 AW591216 AW36871 9 AW378408 BE1 22835 M582976 BE350422 AA41 8328 A1541454 AI565930 
AA583700 AA150575 AW238427 AI287474 AA912658 AA584223 AW238528 C17918 AW136169 AA159847 AI923797 A1609009 BE182479 
AI915198 AW3781 1 4 AA147179 M584239 AA1 50532 AW1 68862 AW085999 AW082480 M659742 AW079703 A1872793 AA583981 AI824571 
BE182316 8E182507AA233331 AI824572 AI540586 D29492 BE 182931 AA036948 BE551821 D29401 AW378365 C00141 D29181 D29567 
AW103359 W95238 A1991663 AA587298 BE184608 M099833 W95121 W95150 D29584 AI9341 1 1 D29456 D29533 AW265380 D29290 
AW238463 AA121041 D29204 AA595925 D29441 AW081840 AA587018 D29323 AA582891 BE182433 BE182437 BE158295 BE182434 
AW01 5534 AA31 4369 M290715 BE568683 AW629494 D28364 AW995678 

AI9071 14 AA580734 AL041945 M10151 5 M1 21 344 D781 30 NM.0031 29 AA341 650 T841 66 AF098865 AA1 30976 BE089553 
H05719 F13446 T66122 AW175590 F05344 A11 14790 R12900 AA194871 AA132298 D78129 AA132213 AW948930 AW948919 AA263053 AW946593 AW948840 
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Table 2A shows 504 genes down-regulated in lung tumors relative to normal lung and chronically diseased lung. Chronically diseased lung samples represent chronic non- 
malignant lung diseases such as fibrosis, emphysema, and bronchitis. These genes were selected from 59680 probesets on the Eos/Affymetrix Hu03 Genechip array. Gene 
expression data for each probeset obtained from this analysis were expressed as average intensity (AI), a normalized value reflecting the relative level of mRNA expression. 
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Unique Eos probeset identifier number 

Exemplar Accession number, Genbank accession number 

Unigene number 

Unigene gene title 

90th percentile of AI for normal lung samples divided by the 80th percentile of AI for adenocarcinoma and squamous cell carcinoma lung tumor 
samples. 

median of AI for normal lung samples divided by 90th percentile of AI for adenocarcinoma and squamous cell carcinoma lung tumor samples. 
median of AI for normal lung samples minus the 15th percentile of AI for all normal lung, chronically diseased lung and tumor samples divided by 
the 90th percentile of AI for adenocarcinoma and squamous cell carcinoma lung tumor samples minus the 15th percentile of AI for all normal 
lung, chronically diseased lung and tumor samples. 

average of AI for normal lung samples divided by average AI for squamous cell carcinoma and adenocarcinoma lung tumors. 
median of AI for normal lung samples divided by the 90th percentile of AI for adenocarcinomas. 

median of AI for normal lung samples minus the 15th percentile of AI for all normal lung, chronically diseased lung and tumor samples divided by the 90th 
percentile of AI for adenocarcinomas minus the 15th percentile of AI for all normal lung, chronically diseased lung and tumor samples. 
average of AI for normal lung samples divided by the 90th percentile of AI for squamous cell carcinomas. 

median of AI for normal lung samples minus the 15th percentile of AI for all normal lung, chronically diseased lung and tumor samples divided by the 90th 
percentile of AI for squamous cell carcinomas minus the 15th percentile of AI for all normal lung, chronically diseased lung and tumor samples. 
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Hs. 31 1662 


EST 


09613 


H47315 


Hs.27519 


ESTS 


109650 


R31770 


Hs.23540 


ESTS 


109682 


1 1 4 nrv -4 "7 

H18017 


Hs.22869 


ESTS 


09724 


D59899 


Hs.1 27842 


ESTS 


1 09782 


AB020644 


Hs.1 4945 


long fatty acyl-CoA synthetase 2 gene 


109833 


R79864 


Hs.29889 


EolS 


109837 


H00656 


Hs.29792 


bo IS 


109977 


T64183 


HS. 282982 


bo IS 


109984 


AI796320 


Hs.10299 


rpT, 

ESTS 


1 4 S\A AC 

110146 


LM 4 OOVt 

H41324 


Hs.olool 


bo i s, Moderately similar to 01 in 1 aain 1 b 


110271 


n289B5 


nS.31330 


to IS 


110280 


AW874263 


Hs.324b8 


rcTn 

to Is 


1 1 0420 


ono4 4 4 
R93141 


HS.1o4zo1 


to is 


110578 


T62507 


Hs.nodo 


to IS 


1 10634 


R98905 


ij_ ocnoo 
HS.o59y2 


to IS 


110726 


a \Aint4 04 0 

AW961818 


Hs. 24379 


potassium voltage-gated channel, shaker- 


110837 


LinO'i no. 


HS.1Ub9ZU 


to t s, weaKiy similar to semapnonn r Ln. 


1 1 0875 


N35070 


HS.26401 


tumor necrosis factor (ligand) superfami 


110894 


Dry ooro 

R92356 


1)_ /»iJOD4 


to 1 s, Moderately similar to cytoplasmic 


♦ A /\n~7 A 

110971 


AI760098 


I 1_ r%4 AAA 

Hs.2141 1 


TOT- 

EolS 


\ a a r\*\i 

111023 


AV655386 


HS.7645 


to Is 


i A A A f 7 

111057 


T79639 


Lt_ 4 Aeon 
HS.1 4629 


rpTn 

EolS 


111247 


AW058350 


Hs. 16762 


Homo sapiens mKNA, cuna ur\rzpob*iD^Ub^ {j 


111330 


BE247767 


1 j_ 4 0 4CC 

Hs. 18166 


KIAAU8/0 protein 


t 4 4 Of A 

111374 


BE250726 


HS.283/24 


to is, Moderately similar to niA^ [n.sap 


1 a a A A n 

111442 


AW449573 


u_ 4 Q4 nno 
HS.1 81 003 


POTn 

to IS 


14 4 701 

111737 


un Acm 

H04607 


M_ no 4 D 

HS.9218 


cot. 
to IS 


4 4 4 ~? A ~t 

111747 


A1*7J| 4 jl"74 

AI741471 


Hs.2dbbo 


to IS 


111807 


R33508 


HS. 18827 


tSTS 


111862 


R37472 


1 1_ 04 ccn 

Hs.21559 


bSI 


I A OA A C 

I 1 2045 


A 1 170COO 

A1372588 


HS.8022 


1 U3A protein 


112057 


R43713 


1 k Ann 4 c 

Hs. 22945 


EST 


t A {~\t~\ A d 

112214 


a \a iA ^nnr*o 

AWT 48652 


Hs. 167398 


ESTs 


1 4 ooco 

1 1 2263 


R52393 


U« ocn4 1 
HS.2591 / 


bo IS 


l a tf\ n J A 

112314 


AW206093 


1 1 a^ *t An 

Hs.748 


rpT. 

ESTs 


112324 


R55965 


Hs. 26479 


limbic system-associated membrane protei 


112362 


AW300887 


Hs.26638 


ESTs; Weakly similar to UU20 receptor [n 


112380 


1 loon a f\ 

H63010 


1 c~r Af\ 

Hs.5740 


rpTi. 

ESTs 


112425 


a a nn jnr\n 

AA324998 


Hs. 32 1677 


ESTs; Weakly similar to !!!! ALU oUBhAMi 


112473 


R65993 


Hs.279798 


pregnancy specitic oeta-i -glycoprotein y 


112492 


N51620 


Hs.28694 


ESTs 


112541 


AF038392 


1 |_ 4 4 CC1A 

Hs. 116674 


EolS 


112620 


R80552 


1 1_ »inn>in 
HS.29040 


ho IS 


1 1 2623 


A V A ?OT O A f\ A 

AW373104 


HS. 25094 


holS 


1 4 OOC7 

112867 


Tno rye A 

T03254 


HS.1b/o93 


bo IS 


1 4 ion A 

1 1 2894 


TA0 4 DO 

T08188 


HS.6f (\J 


COTp 

bo IS 


112954 


AA928953 


Hs.bboo 


bo IS 


4 4 onin 

313029 


A \ A/HO 4 *74 (\ 

AW081710 


II— "70CO 

Hs.73b9 


COTp. \ft/^>oL-li/ Pimilnr \r\ UN Al 1 1 Ol IPCAMt 

bo 1 s f weakly similar to un alu ouorAMt 


113086 


A A *5 ACOnCt 

AA346839 


HS.2091U0 


UKr^r434L» I fi protein 


113140 


T50405 


HS.1759b7 


bSlS 


113252 


NM_004469 


1 )„ 4 4 nnn 

Hs.11392 


c-fos induced growth factor (vascular en 


113257 


a mo4 >i~tO 

Al 82 1378 


HS- 159367 


ESTS 


113394 


T81473 


t 1— A "7*70A A 

Hs. 177894 


ESTs 


113437 


T85349 


Hs.1 5923 


r - nj 

EST 


1 1 3454 


A lAOn4 f& 

A1022166 


1 l_ 4 C4 OO 

Hs. 16188 


ESTs 


4 A Of 

113502 


T89130 




EolS 


113552 


AI654223 


HS.1 602b 


ESTS 


1 4 iff x c 

113645 


T95358 


n» 0004 Q4 

HS.3J31B1 


COT™ 

ESIS 


1 4 0 c>rs 4 

113691 


T96935 


Hs.1 7932 


COT 

EST 


4 A Trnr* 

113706 


AA004693 


li_ non4 nn 

HS.269192 


ESTs 


113883 


U89281 


4 4 QCQ 


oxidative 3 alpha hydroxysteroid dehydro 


1 4 on ox 

113924 


BE1 78285 


nS.1 /UUob 


Homo sapiens mKNA, cuima UArzpooDDU^u (i 


1 1 4035 


W92798 


1 1_ oen4 0 4 
Hs.269181 


COT*. 

ESTS 


114058 


A 1/AAOAH r» 

AK002016 


■ i_ 4 4 J-70T 
Hs. 114727 


ESTs 


114084 


A A 7AAA^r 

AA708035 


Hs.1 2248 


ESTs 


(14121 


R05785 


Hs. 25425 


ESTS 


I A IJ A J 

114124 


W57554 


Hs.125019 


Human lymphoid nuclear protein (LAF-4) 


114275 


AW5 15443 


U#« OnC4 H7 

Hs.30b1 17 


interleukin 13 receptor, alpha 1 


114297 


AA1 49707 


li_ 4-Tonn4 

Hs. 173091 


DKFZP434K1bl protein 


A A A A 

114427 


A A nH'74 -to 

AA01 71 76 


t 1 — . nnrnn 

Hs.33532 


ESTs; Highly similar to Miz-1 protein [n 


114449 


AA020736 




"ze63b11.s1 Soares retina N2b4HR Homo sa 


114452 


AI369275 


Hs.243010 


ESTs, Moderately similar to RTC0_HUMAN G 


114609 


AA079505 




n zm97a5.s1 Stratagene colon HT29 (#93722 


114648 


AA101056 




n zn25b3.s1 Stratagene neuroepithelium NT 


114731 


BE094291 


Hs.155651 


Homo sapiens HNF-3beta mRNA for hepatocy 


114762 


AA146979 


Hs.288464 


ESTs 
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2.40 
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10.00 

8.40 
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6.49 



44.20 
28.40 



3.13 



5.33 



32.40 
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9.00 



8.00 
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2.49 
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35.00 
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7.00 
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6.00 



2.31 



30.40 
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7.00 
6.00 



14.00 



PCT/US02/12476 



2.11 



10.00 



3.44 
2.92 



40.80 
54.40 



29.40 



8.00 



107.00 



32.00 



56.80 



44.60 



2.75 
2.22 



3.48 



20.00 



4.15 



17.14 



4.58 



3.42 
3.91 



33.20 
53.00 



3.91 



2.74 
4.92 



13.00 
14.00 



29.80 



4.53 
3.62 



12.00 



4.39 
4.47 



10.00 



3.72 
3.60 



3.88 



2.58 



38.20 



3.09 



13.00 



5.00 



40.60 



48.80 



10.00 



3.45 



3.13 



35.40 



3.42 



33.00 



97 



WO 02/086443 



114776 


AA151719 


Hs.95834 


ESTs 


115009 


AA251561 


1 1 A /% r> ^» 

Hs.48689 


r~ /"I ~~r~ 

ESTs 


115272 


AW015947 




jT~» -W— 1 ft) ft 11 1 •■ ft! J 1 I* ft ft J 

ESTs; Weakly similar to hypothetical L1 


115279 


AW964897 


Hs.290825 


ESTs 


115302 


AL109719 


Hs.47578 


ESTs 


115365 


AW976252 


* | A AAA A J 

Hs.268391 


ESTs 


115559 


AL079707 


Hs.207443 


ESTs 


115566 


lift M A 

Al 142336 


Hs.43977 


ESTs 


115683 


AF255910 


ft 1 f - ft y\ •* /-\ 

Hs.54650 


ESTs, Weakly similar to (defline not ava 


115744 


AA418538 


11 A t"\ S\ A r* 

Hs.43945 


ESTs; Highly similar to dJ1 178H5.3 [H.sa 


115819 


M486620 


11 A A A r\ r— 

Hs.41135 


Endomucin 2 


115949 


ft ft ft ~ * « ft j^^v 

AI478427 


Ik A *~\ A s> r* 

Hs.43125 


ESTs 


115965 


AA001732 


Hs. 173233 


ft - ^"T* 

ESTs 


116035 


AA621405 


Hs.1 84664 


ESTs 


116049 


M454033 


it j j j j 

Hs.41644 


ESTs 


116081 


Al 190071 


Hs.55278 


ESTs 


116082 


AB029496 


Hs.59729 


ESTs 


116213 


AA292105 


Hs.326740 


i * » * • * * f*i in • t ■■ 

leucine rich repeat (in FLII) interactin 


116228 


AI7679A7 


Hs.50841 


ESTs; Weakly similar to tuftelin [M.musc 


116250 


N76712 


Hs.44829 


ESTs 


116419 


AI613480 


Hs.47152 


I ft ft 11 ft •! ft ft 1* .1 ill* 

ESTs; Weakly similar to testicular tekti 


116617 


D80761 


Hs.45220 


EST 


116784 


AB007979 


Hs.301281 


tenascin R (restrictin; janusin) 


116835 


N39230 


1 1 aha j n 

Hs.38218 


ESTs 


116970 


AB023179 


Hs.9059 


1 #\ ft ft aaaa -.Jt— 

KIAA0962 protein 


117023 


AW070211 


It j An j > j - 

Hs. 10241 5 


ESTs 


117027 


ft ft A )ft fAi t — y"\ A A 

AW085208 


Hs.1 30093 


ESTs 


117036 


H88908 


t i J A A a 

Hs.41192 


EST 


117110 


M160079 


Hs. 172932 


ESTs 


117209 


W03011 


Hs.306881 


ESTs 


117325 


N23599 


Hs.43396 


ESTs 


117454 


N29569 


Hs.44055 


ESTs 


117475 


N30205 


ft 1 j»» M ft r% 

Hs.93740 


ESTs 


117543 


BE219453 


ft ft A ^"v *h *v 

Hs.42722 


ESTs 


117567 


AW444761 


Hs.44565 


ESTs 


117570 


N48649 


Hs.44583 


ESTs 


117600 


N34963 


Hs.44676 


EST 


117730 


N45513 


1 1 .J 4* A M. 

Hs.46608 


ESTs 


117791 


ft ft J A #% m 

N48325 


Hs.93956 


EST 


117929 


N51075 


Hs.47191 


ESTs 


117990 


AA446167 


Hs.47385 


ESTs 


118224 


N62275 


Hs.48503 


f— #Ak.«« 

EST 


118244 


N62516 


Hs.48556 


ESTs 


118357 


AL1 09667 


11 A i-\ A A r~ A 

Hs. 1241 54 


Homo sapiens mRNA full length insert cDN 


118446 


N66361 


Hs.269121 


ESTs 


118447 


N66399 


ft 1 1 J #-\ A 

Hs.49193 


EST 


118530 


N67900 


It J J ft ft r-V 

Hs. 118446 


ESTs 


118549 


N68163 


ft 1 A AMAA ^ * 

Hs.322954 


EST 


118823 


W03754 


Hs.50813 


hftfe 11 ft ftl ) * r 1 1 

ESTs; Weakly similar to long chain fatty 


118862 


W17065 


Hs.54522 


ESTs 


118935 


AI979247 


Hs.247043 


1 S 1 ft ft ^ ^ r" 1 ft 

KIAA0525 protein 


118944 


AI734233 


Hs.226142 


— _ — , - - amft ft 1 ft •■ ft nil 1 1 t | ^% | f» ft ■ J 1 

ESTs; Weakly similar to !!!! ALU SUBFAMI 


118995 


N94591 


ft ft V A ^ A. 

Hs.323056 


ESTs 


119073 


BE245360 


Hs.279477 


^— _ a a— y» Jftftft ♦ a | ft ft 1 ♦ 

ERG-2/ERG-1; V-ets avian erythroblastosi 


119268 


T16335 


Hs.65325 


EST 


119514 


W37937 




ft ft i ft* _ j ft • 1 ft _ 

Accession not listed in Genbank 


119824 


W74536 


ii j j~ ^ 

Hs.1 84 


i ii i i ■ . i i i ^_ • 

advanced glycosylation end product-speci 


119831 


AL1 17664 


1 ft C t^i M A /~\ 

Hs.58419 


DKFZP586L2024 protein 


119861 


ft ft 1 ■ ^% M J A 

W78816 


Hs.49943 


ESTs; Moderately similar to !!!! ALU SUB 


119889 


W84346 


Hs.58671 


r - t~\ v t" 

ESTs 


119921 


W861 92 


Hs.58815 


ESTs 


120082 


H80286 


Hs.40111 


ESTs 


120094 


AA811339 


Hs.1 24049 


ESTs 


120132 


W57554 


Hs.125019 


Human lymphoid nuclear protein (LAF-4) 


120378 


AA223249 


ft ft *\ m-+ 

Hs.285728 


ESTs 


120404 


AB023230- 


Hs.96427 


ft M ■ ft > A .~\ A 1 ft 

KIAA1 01 3 protein 


120504 


AA256837 




ESTs 


120512 


N55761 


Hs.1 94718 


ESTs 


120667 


AA287740 


Hs.78335 


microtubule-associated protein; RP/EB fa 


120777 


AA287702 


ft 1 A A 

Hs. 10031 


| > | ft ft JKK«*» | ft 

KIAA0955 protein 


121082 


AA398722 




ESTs 


121191 


ft ft A fS. A. ^» ^ 

AA400205 


Hs.104447 


ESTs 


121248 


ft ft J A J A 

AA400914 


Hs.97827 


EST 


121363 


AI287280 


Hs.97933 


ESTs 


121366 


AI743515 




ESTs 


121483 


AI660332 


1 1 r\ /- s — r ft 

Hs.25274 


ESTs; Moderately similar to putative sev 


121518 


M412155 




ESTs 


121545 


ft ft A A r\ a m r\ 

AA412442 


ft ft /S j M A 

Hs.98132 


ESTs 


121622 


AA416931 


Hs.1 26065 


ESTs 


121665 


AA416556 


Hs.98234 


ESTs 


121709 


AI338247 


Hs.98314 


Homo sapiens mRNA; cDNA DKFZp586L0120 (f 


121730 


AI140683 


Hs.98328 


ESTs 


121740 


M421138 


Hs.98334 


EST 


121772 


AI590770 


HS.1 10347 


Homo sapiens mRNA for alpha integrin bin 


121821 


AL040235 


Hs.3346 


ESTs 



34.40 
30.20 
32.60 



6.00 



31.40 



3.18 



50.60 



6.00 



3.06 
3.85 

* 2.27 



47.20 



49.40 



8.67 



44.00 



16.00 



6.00 
9.00 

8.00 



31.40 
32.80 



30.80 



2.40 
2.28 



3.94 



14.00 



31.40 



2.75 



29.00 



6.00 
12.00 



39.40 
33.00 

41.60 



2.29 



34.80 
38.80 

36.20 



9.00 



7.00 



48.00 
56.20 

33.60 
74.40 

388.80 

33.20 

45.80 



30.00 

41.20 
91.00 
32,60 
30.60 



29.20 



33.00 



52.60 



33.80 
30.03 



36.60 



46.60 
39.00 



30.20 
34.80 
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121835 
121841 
121885 
121888 
121938 
121950 
122030 
122054 
122211 
122233 
122247 
122253 
122266 
122285 
122409 
122485 
122697 
122772 
122831 
122913 
123049 
123076 
123136 
123309 
123455 
123691 
123756 
123802 
123837 
123844 
123936 
123987 
124013 
124160 
124205 
124226 
124246 
124348 
124358 
124409 
124442 
124468 
124479 
124519 
124711 
124866 
124874 
125097 
125179 
125200 
125299 
125400 
125810 
126176 
126303 
126403 
126507 
126773 
127307 
127462 
127486 
127572 
127609 
127832 
127898 
128073 
128101 
128149 
128212 
128333 
128364 
128426 
128598 
128634 
128687 
128726 
128773 
128833 
128870 
128878 
128885 
128998 
129000 
129038 
129098 



AB033030 

AA427794 

M934883 

AA426429 

AA428659 

M429515 

M431310 

M431725 

AA300900 

M436455 

AA436676 

AA436703 

M436840 

AA436981 

AA446830 

AA524547 

AA420683 

AW1 17452 

AI857570 

AI638774 

BE047680 

AI345569 

AW451999 

N52937 

M353113 

AA609579 

AA609971 

M620448 

AI807243 

AA938905 

NM 004673 

C21171 

AI521936 

R40290 

H77570 

AA618527 

H67680 

AI796320 

AW070211 

AI814166 

AW663632 

N51413 

AB011130 

A1670056 

NMJJ04657 

AI768289 

BE550182 

AW576389 

AW206468 

AW836591 

T32982 

AL110151 

H00083 

BE242256 

D78841 

AW629054 

AL040137 

M648284 

AW962712 

AA760776 

AW002846 

AA594027 

X80031 

AW976035 

M774725 

AW340720 

AA905730 

NMJJ12214 

W27411 

W68800 

N76462 

AI265784 

AA305407 

AA464918 

AW271273 

A1311238 

NM.004131 

W26667 

H39537 

R25513 

AF134803 

W04245 

M744902 

AW1 56903 

AW580945 



Hs.300670 
Hs.1 04864 
Hs.98467 
Hs.98463 
Hs.98610 

Hs.98724 

Hs.98746 

Hs.98849 

Hs.98872 

Hs.98890 

Hs. 104936 

Hs.98907 

Hs.121602 

Hs,99081 

Hs.160318 

Hs.98321 

Hs.99489 

Hs.5120 

Hs.1 05328 

Hs.211869 

Hs.1 90046 

Hs.1 94024 

Hs.102679 

Hs.1 12497 

Hs.112724 

Hs.1 12795 

Hs.112893 

Hs.120017 

Hs.241519 

Hs.95497 

Hs.107149 

Hs.1 24685 

Hs.108135 

Hs.1 90266 

Hs.270962 

Hs.10299 

Hs.1 0241 5 

Hs.1 07197 

Hs.285625 

Hs.109284 

Hs.1 27436 

Hs.137274 

Hs.26530 

Hs.304389 

Hs.127826 

Hs.335774 

Hs.103118 

Hs.1 031 56 

Hs.102720 

Hs.128797 

Hs.2441 

Hs.125976 

Hs.23964 

Hs.1 87584 

Hs.126712 

Hs.293977 

Hs.105468 

Hs.191788 

Hs.530 

Hs.292396 

Hs.128970 

Hs.1 25983 

Hs.1 28254 

Hs.177576 

Hs.336920 

Hs.12126 

Hs.269152 

Hs.145197 

Hs.102308 

Hs.23767 

Hs.1 04476 

Hs.1051 

Hs.1 84581 

Hs.75309 

Hs.10683 

Hs.1 801 41 

Hs.107761 

Hs.1 07767 

Hs.108124 

Hs.330466 



ESTs 2.34 

ESTs 2.61 

ESTs 

ESTs 

ESTs 

EST 

ESTs 34.40 
EST 

ESTs; Moderately similar to bithoraxoid- 49.40 
EST 29.80 
EST 

ESTs; Weakly similar to hypothetical pro 9.00 

EST 

EST 

ESTs 30.80 

phospholemman 2.65 

Homo sapiens cDNA FLJ14103 fis, clone MA 15.00 

ESTs 6.67 

ESTs 

ESTs 

ESTs 

ESTs 35.80 

ESTs 

ESTs 

ESTs 

ESTs 

EST 35.40 
Homo sapiens clone 24760 mRNA sequence 58.00 
ESTs 

olfactory receptor; family 7; subfamily 2.63 

ESTs 29.00 

ESTs; Weakly similar to GLUCOSE TRANSPOR 

ESTs; Weakly similar to PTB-ASSOCIATED S 28.40 

ESTs 

ESTs 

ESTs 2.35 
ESTs 

ESTs 17.00 
"yw35g1 1.s1 Morton Fetal Cochlea Homo sa 3.07 
ESTs 

TATA box binding protein (TBP)-associate 2.48 
ESTs 

calcium channel; voltage-dependent; alph 

ESTs; Weakly similar to SPLICEOSOME ASSO 2.50 

serum deprivation response (phosphatidyl 59.20 

ESTs 8.00 

ESTs 

ESTs 

ESTs 

ESTs 

ESTs 

DKFZP586D0824 protein 
aryl hydrocarbon receptor-interacting pr 
KIAA0022 gene product 
HUM525A05B Human placenta polyA+ (TFuji 
ESTs; Weakly similar to metalloprotease/ 
ESTs; Weakly similar to HC1 ORF [M.muscu 
ESTs 

ESTs; Weakly similar to plL2 hypothetica 
aa59b04.s1 NCI_CGAP_GCB1 Homo sapiens c 
ESTs 9.00 
ESTs 2.36 
ESTs 
ESTs 
ESTs 
ESTs 

ESTs 7.33 
mannosyl (alpha-1;3-)-glycoprotein beta- 

glutathione peroxidase 3 (plasma) 3.09 
ESTs; Weakly similar to LR8 [H.sapiens] 

ESTs; Weakly similar to ZINC FINGER PROT 10.00 

ESTs 
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TABLE 2B shows the accession numbers for those primekeys lacking unigeneID's for Table 2A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey 

108447 
108550 
108655 
102397 
126303 
125810 
103627 
121366 
114609 
115272 
108338 
108434 
123302 
102310 
102636 
104776 
120504 
113502 
108499 
101308 
108629 
103098 
103241 
103508 
103575 
119514 
121082 
128634 
105817 
121518 
114449 
114648 
121950 
107723 



CAT number Accessions 

43452_-7 AA079126 

1 20073 J M084867 AA084996 

127522J AA099960 AA113013 

4437L-1 U41898 

1525933J D78841 D78880 

1554054.1 H00083R81062 

2615.2 Z48513Z48512 

280401 J AI74351 5 AA40561 7 AW276706 

1 1 6777 J AA079505 AA079537 

172113J AW015947 AA21 1890 AA279425 

112186 1 AA070773AA070774 

1 1401 2 J AA078899 AA078782 AA075788 

genbank.AA620448 AA620448 

NOT_FOUND_entrez_U33839 U33839 

entrez_U67092 U67092 

genbanl^AA026349 AA026349 

genbank AA256837 AA256837 

genbank T89130T89130 

genbank_AA083103 M083103 

entrez_L41390 L41390 

genbank_AA1 02425 M1 02425 

221.215 M86361 Z26593 X02850 D13070AE000659 M17649 M87869M87871 X61077 M16286 AF018169 X61079S59351 X60142 AF043169 

entrez_X76223 X76223 
entrez_Y10141 Y10141 
entrez_Z26256 Z26256 
NOT_FOUND_entrez_W37937 W37937 
genbank_AA398722 AA398722 
AA464918_at AA464918 

AA397825 
M412155 
AA020736 
M101056 
M429515 
M015967 



genbank_AA397825 
genbank_AA412155 
genbankJW)20736 
genbank„AA101056 
genbank„AA4295l5 
genbanleAA015967 
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Table 3A shows 452 genes up-regulated in chronically diseased lung relative to normal lung. Chronically diseased lung samples represent chronic non-malignant lung diseases 
such as fibrosis, emphysema, and bronchitis. These genes were selected from 59680 probesets on the Eos/Affymetrix Hu03 Genechip array. Gene expression data for each 
probeset obtained from this analysis was expressed as average intensity (AI), a normalized value reflecting the relative level of mRNA expression. 



Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 

R1: 80th percentile of AI for chronically diseased lung samples divided by the 90th percentile of AI for normal lung samples. 

R2: 80th percentile of AI for chronically diseased lung samples divided by the 90th percentile of normal lung samples, squamous cell carcinomas and 
adenocarcinomas 

R3: 70th percentile of AI for chronically diseased lung samples minus the 15th percentile of AI for all normal lung, chronically diseased lung and tumor samples 
divided by the 90th percentile of normal lung samples, squamous cell carcinomas and adenocarcinomas minus the 15th percentile of AI for all normal lung, 
chronically diseased lung and tumor samples 
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4] A T 4 

10.71 






4 ,4 J r*A A 

114518 


A i A M A A A at 

AW1 63267 


t i_ 4 nn 4 nn 

Hs. 106469 


suppressor of varl (S.cerevisiae) 3-like 
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NM_016929 


1 1 A A A A A 41 

Hs.283021 


Li * 1 > 1 _ _ li I _^ ^ I 1 r* 
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gb:ye12d01.s1 Stratagene lung (937210) H 




o Ar* 

8.35 




113288 


A! 076 838 


II— /4 nnn*7 

Hs.12967 


ESTs 


12.40 






113252 


NM_004469 


11 4 4 A A A 

Hs.11392 


c-fos induced growth factor (vascular en 




4 A"? 

4.27 




I 4 n o. A n 

113238 


R45467 


\ t 4 n n n 4 A 

Hs.189813 


r— AT* 

ESTs 








113203 


AA743563 


11 4 n A A r* 

Hs. 10305 


ESTs 


A4 A A 

21.20 






113195 


i | nnnn a 

H83265 


1 1^ A A O 4 

Hs.8881 


PAT- l A if— — t„l. . — *— _ 1— A 4 4 A 4 jl n ti ■■ n nn «-> n * .rt * 

ESTs, Weakly similar to S41044 chromosom 






1.92 


113089 


T40707 


1 \ A*^AAAA 

Hs.270862 


r-» A "T* 

ESTs 


4 A A A 

14.33 






113076 


A F""nAA4AA 

AF033199 


1 1 A 4 A A 

Hs.8198 


zinc finger protein 204 




A A A 

6.00 




113009 


tao n n n 

T23699 


1 l in JA 

Hs.7246 


ESTs 




n An 

9.40 




112937 


a inn 4 c^aa 

AI694320 


1 1 A A A W~ 

Hs.6295 


■ — r>-r~ IAJ ll_ ♦ •■ 1 4 ^ A A A Al- 1* 

ESTs, Weakly similar to T17248 hypotheti 




41 A AA 

12.20 




t A AA A41 

112891 


-T-nnn n-r 

T03927 


1 1 _ nnni 1-7 

Hs. 293 147 


f~ AT— IIa.aImaaI.1.. *.-*! — m A— A 4 A A 4 A W 1* 

ESTs, Moderately similar to A46010 X-li 


10.57 






(12794 


A^A 4 A 

R97018 




L — • * »_ n A 4) A AT— it— 1 1* 1— . _. 

gb:yq74b08.s1 Soares fetal hverspieen 


AA AA 

26.60 






I A Ai^A 4 

112691 


r^n at n n 

R88708 


1 ! AAAA J *f 

Hs.220647 


ESTs 


4A A A 

15.33 






I 4 o^nn 

112602 


A l A IA A JA ir 

AW004045 


1 l_ n A A A A i" 

Hs.203365 


ESTs 


15.60 






1 4 AAAA 

112366 


a r-nn a n 4 n 

AF035318 


t l 4 n p*aa 

Hs. 12533 


Homo sapiens clone 23705 mRNA sequence 


4 A 4 A 

15.40 






l A A a A a 

112210 


n J nn a ^ 

R49645 


l 1— «7A n 4 

Hs.7004 


m.T*_ 

ESTs 


4 A AA 

14.00 






1 41 t~\ f\ f\ 4 

112064 


Al AA^nnnA 

AL049390 


* 1 AAAAA 
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A A r*nn-rn4 

AA593731 


Hs.325823 


»J— J — - — I 1 — ■_— 'I — — 2— All It? Ml II 1 A kl A 

ESTs, Moderately similar to ALU5_HUMAN A 






j -7-7 
1.77 


f 11737 


1 lA J A Aw 

H04607 


■ 1 A A 4 A 

Hs.9218 


ESTs 






A A A 

1.86 


11605 


A 4 A A J 

T91061 


1 1 4 A A J MA 

Hs.1 94178 


A "A A A 1 il ■ • 1 j i— > .^v AAAA A*— . _» 

ESTs, Moderately similar to PC4259 fern 


nn nn 

23.00 






111510 


R07856 


Hs. 16355 


ESTs 


4 A AA 

11.02 






4 4 A 4 4 

11341 


A 1 4 r- — r 4 A A 

AL1 57484 


■ t A A AAA 

Hs.22483 


It * W—% A 1 A A\A 1 A A\> ✓^T^ TA Al A 4 A*** /J*^ 

Homo sapiens mRNA; cDNA DKFZp762M127 (fr 






4! A A 

1.88 


111280 


AA373527 


Hs, 19385 


CGI-58 protein 


4A J A 

18.40 






11247 


A t i (A r A n r - n 

AW058350 


11 4 A^vAA 
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Hs.133521 


ESTs 
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a at a a a 

107681 
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Hs.49136 
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107230 
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107029 
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AF 128847 
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Hs. 12592 


A AAA4 A 

106818 


A 1 ^A A A4 AC 

AK002135 


Hs.3542 


J A AT AT 

106797 


A 1 TA A A A A 

AI768801 
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Hs.1 26083 


4 A f~ A A A 

105986 


A HAT7700 

AB037722 


Hs.8707 


4 A r— n A A 

105894 


A 1 AA J T A A 

AI904740 
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ESTs 
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ESTs 
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ESTs 
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ESTs, Moderately similar to ALU7„HUMAN A 

EST 

DKFZP566F2124 protein 
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Homo sapiens cDNA: FLJ21042 fis, clone C 
ESTs 

DKFZP434B203 protein 

gb:zj99f01 .s1 Soares_pregnanLuterus JIbH 

Homo sapiens beta-1 adrenergic receptor 

ESTs 

gb:EST00057 HE6W Homo sapiens cDNA clone 
Homo sapiens cDNA FLJ 10229 fis, clone HE 
KIAA0300 protein 

Homo sapiens mRNA; cDNA DKFZp434M229 (fr 
hypothetical protein FLJ10849 
succinate-CoA ligase, GDP-forming, alpha 
caveolin 1, caveolae protein, 22kD 
CD83 antigen (activated B lymphocytes, i 
flavin containing monooxygenase 2 
A kinase (PRKA) anchor protein 1 
RAS p21 protein activator (GTPase activa 
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egf-Iike module containing, mucin-like, 
cadherin 5, type 2, VE-cadherin (vascula 
LIM domain only 2 (rhombotin-like 1) 
protein tyrosine phosphatase, receptor t 
progastricsin (pepsinogen C) 
CUG triplet repeat, RNA-binding protein 
CDP-diacylglycerol synthase (phosphatida 
signal transducing adaptor molecule (SH3 
amine oxidase, copper containing 3 (vasc 
protein kinase C-like 2 
guanine nucleotide binding protein 11 
chemokine (C-X3-C) receptor 1 
steroidogenic acute regulatory protein 
spleen tyrosine kinase 
mannose receptor, C type 1 
myeloid cell nuclear differentiation ant 
S100 calcium-binding protein A4 (calcium 
tachykinin, precursor 1 (substance K, su 
complement component 5 receptor 1 (C5al 
gb:Human alpha satellite and satellite 3 
coagulation factor VIII, procoagulant co 
hydroxyprostaglandin dehydrogenase 15-(N 
calcitonin receptor-like 
FBJ murine osteosarcoma viral oncogene h 
enhancer of filamentation 1 (cas-like do 
microfibrillar-associated protein 4 
gb:Human dystrophin (dp140) mRNA, 5' end 
G protein-coupled receptor kinase 5 
transforming growth factor, beta recepto 
solute carrier family 6 (neurotransmitte 
Charcot-Leyden crystal protein 
fatty acid binding protein 4, adipocyte 
S164 protein 

amyloid beta (A4) precursor protein (pro 
HIR (histone cell cycle regulation defec 
gb:Human nonmuscle myosin heavy chain-B 
KIAA0237 gene product 
src homology three (SH3) and cysteine ri 
Down syndrome critical region gene 1-lik 

growth differentiation factor 10 
macrophage scavenger receptor 1 
hyaluronoglucosaminidase 2 
myocilin, trabecular meshwork inducible 
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18.80 
504.80 
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19.38 

15.40 
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14.80 
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1.76 
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1.75 
2.24 

2.01 
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4.00 
4.24 
6.20 
21.20 



5.40 
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TABLE 3B shows the accession numbers for those primekeys lacking unigeneID's for Table 3A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 



Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey CAT number Accessions 



123619 
126433 
125831 
126816 
126852 
121059 
120637 
122011 
120934 
123802 
116814 
118329 
104404 
104776 
113502 
101262 
108573 
101447 
124357 
108781 
112794 
100351 
100555 



371681.1 AA602964 AA609200 
127143 1 AA325606AA099517N89423 
1522905J H04043 D60988 D60337 
122973 1 AA248234AA090985 
136135J AA399961 M128347 
273450J M393283 AA398628 
200885.1 AA81 1 804 AA809404 AA286907 AW977624 
7617.-2 AA431082 
177521.1 AA226198M226513AA383773 

AA620448 
H50834 
N63520 



genbank.AA620448 
genbank_H50834 
genbank_N63520 
H58762_at H58762 
genbank_AA026349 
genbank_T89130T89130 
entrez_L35854 L35854 
genbank_AA086005 
entrezJ/121305 M21305 
genbank_N22401 
genbankJ\A1 28654 
genbank_R97018 
entrez_D64158 D64158 
tigr_HT2245 M69181 M81 105 U51039 



AA026349 



AA086005 

N22401 
M1 28654 
R97018 
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Table 4A shows 202 genes up-regulated in samples from patients treated with chemotherapy or radiotherapy. These genes were selected from 59680 probesets on the 
Eos/Affymetrix Hu03 Genechip array. Gene expression data for each probeset obtained from this analysis was expressed as average intensity (AI), a normalized value reflecting 
the relative level of mRNA expression. 

Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 

R1: average of AI for samples from patients treated with chemotherapy or radiotherapy divided by the average of AI for normal lung samples. 

Unigene Title R1 

chromosome condensation 1 27.20 

aldo-keto reductase family 1, member C3 20.60 
KIAA0042 gene product 20.40 

glutamate receptor, metabotropic 5 20.60 

E2F transcription factor 3 29.40 

topoisomerase (DNA) II binding protein 23.50 

KIAA0874 protein 35.56 

S1 64 protein 43.40 

POU domain, class 3, transcription facto 21.80 

gb:Human alpha satellite and satellite 3 193.60 

heparin-binding growth factor binding pr 38.40 

bullous pemphigoid antigen 1 (230/240kD) 198.80 

desmoglein 3 (pemphigus vulgaris antigen 78.60 

gap junction protein, beta 2, 26kD (conn 1 62.20 

nuclear autoantigenic sperm protein (his 50.00 

cytosolic ovarian carcinoma antigen 1 26.00 

UDP-N-acetyl-alpha-D-galactosamine:polyp 37.20 
mutS (E. coli) homolog 2 (colon cancer, 

RAR-related orphan receptor A 32.00 

ISL1 transcription factor, LIM/homeodoma 51.20 

deoxyguanosine kinase 13.90 

Homo sapiens cDNA: FLJ21800 fis, clone H 28.80 

preferentially expressed antigen in mela 110.60 

neurotensin 116.80 

enolase 2, (gamma, neuronal) 2.30 

matrix metalloproteinase 1 (interstitial 181.40 

serum/glucocorticoid regulated kinase 49.20 

5T4 oncofetal trophoblast glycoprotein 86.60 

Homo sapiens mRNA; cDNA DKFZp564D016 (fr 42.60 

ESTs 29.40 

KIAA1488 protein 21.50 

hypothetical protein FLJ20287 32.80 

Homo sapiens PR02751 mRNA, complete cds 20.20 

paired box gene 5 (B-cell lineage specif 28.40 

downstream neighbor of SON 25.40 

ESTs, Weakly similar to I38022 hypotheti 32.00 
Homo sapiens mRNA; cDNA DKFZp761G02121 { 40.60 

ESTs 59.80 

ESTs 43.40 

phosphoserine aminotransferase 50.80 

gb:tk04g09.x1 NCI_CGAP_Lu24 Homo sapiens 53.40 

KIAA0922 protein 20.88 

DKFZP566F21 24 protein 23.60 

Homo sapiens mRNA; cDNA DKFZp762G207 (fr 57.20 

Ig superfamily receptor LNIR 49.00 

hypothetical protein 19.67 

collagen, type XVII, alpha 1 48.17 

RAB6 interacting, kinesin-like (rabkines 59.20 

KIAA0863 protein 28.60 

hypothetical protein FLJ10493 22.80 
KIAA1702 protein 

ESTs 21.00 

trinucleotide repeat containing 9 31.60 

ESTs 24.20 

hypothetical protein MGC5487 21.40 

ESTs 20.40 

kinesin family member 13A 19.60 

ESTs 24.00 

HMT1 (hnRNP methyltransferase, S. cerevi 28.40 

zinc-fingers and homeoboxes 1 36.00 

PDZ domain containing 1 61 .20 

hypothetical protein 24.60 

ESTs 27.20 

LIS1-interacting protein NUDE1 , rat homo 48.00 

KIAA0942 protein 37.80 

CDC14 (cell division cycle 14, S. cerevi 26.80 

solute carrier family 6 (neurotransmitte 63.80 

ESTs, Weakly similar to ALU INHUMAN ALU 26.40 

ESTs, Weakly similar to 155214 salivary 47.64 

ESTs 22.00 

hypothetical protein FLJ 10201 65.00 

Homo sapiens mRNA; cDNA DKFZp761J1324 {f 42.00 

microtubule-associated protein 1B 55.40 
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AA602964 




gb:no97c02.s1 NCLCGAP_Pr2 Homo sapiens 


ao on 

28.80 


j m, j a a A 

124006 


AH 471 55 


1 1 A'-TA a a a 

Hs.270016 


ESTs 


T~r <?n 

77.60 


4 rt A 4 A A 

124169 


BE079334 


t 1. A«Ti AAA 

Hs.271630 


ESTs 


00 on 
22.20 


124281 


A ft A A A""* A» M. 

AI333756 


ft I J J J M M A 

Hs.1 11801 


ft 1 A i * _ a r - 1 Al M 

arsenate resistance protein ARS2 


A A Art 

42.20 


A A J A A, 

124472 


N52517 


11 A A A rt "T A 

Hs. 102670 


A»^" 

EST 


OA A A 

32,60 


124617 


A % ■ I A A A V A A 

AW628168 


11 J Art A A* 

Hs. 152684 


j— a, *t* 

ESTs 


rt J A A 

21 .80 


124631 


fell a A A j| A ^ m Ai 

NM_014053 


1 ft A\wA^A A 

Hs. 270594 


A | A *A<AK ft » 

FLVCR protein 


A A 4 A 

30.40 


J rt. J M M A 

124839 


p* A. A 

R55784 


11 J AAA AA 

Hs.140942 


1— Av A* 

ESTs 


a A A A 

21.20 


125186 


a A A J m A mm 

AA610620 


ll J A A A J 1 

Hs.181244 


* i^i i*i i i 

major histocompatibility complex, class 


A A rt rt 

42.80 


A A A A A J 

125321 


T" rt A A rt A 

T86652 


t 1 4 1AAA A 

Hs.1 78294 


ESTs 


Ck-f rtrt 

27.00 


j a r* A r" 

125535 


ikii M A A A A A 

NM_013243 


ft 1 A AA J A 

Hs.22215 


A 111 

secretogranin III 


AA A A 

23.80 


A rt r* rt j a 

125646 


A A A APiAi^A 

AA628962 


1 1 "T r A A A 

Hs.75209 


^. 1 * ft ^ 1 AlJn J. . _ AA^t^ . — A — A A a1> kli. 

protein kinase (cAMP-dependent, catalyti 


00 on 

23.20 


125684 


A 11 f f A A A A~7 

AW589427 


I i_ a i-nn A ft 

Hs.1 58849 


1 I_aaa aaa!af«m «P\ft 1 A . I~l 1 A 4 A A A X7 a mImma 

Homo sapiens cDNA: FLJ21663 fis, clone C 


0>1 OA 

21.20 


125724 


A 1 AAA i A A 

AL360190 


Hs.295978 


Homo sapiens mRNA full length insert cDN 


t n on 

48.80 


125847 


A1IJ<(AJ AAr* 

AW161885 


1 1 _ A A AAA A 1 

Hs.249034 


ESTs 


04 nn 

31.00 


4 A AAA A 

125934 


AA 193325 


II AAA A A 

Hs.32646 


hypothetical protein FLJ21901 


o«i on 

21.20 


126077 


A A — » rt —f ■•— » r- 1 

M78772 


ft 1 A J rtrtrtrt 

Hs.210836 


ESTs 


Art A A 

49.80 


126299 


AW979155 


Hs.298275 


* * 1 ■ ■ A 

amino acid transporter 2 


A A A A 

21.80 


126395 


A fl A i"\ ^ j-* M A 

AI468004 


ft ft A*vAAP*A 

Hs.278956 


ft A| !♦ ft > • |—i ft J A rt A A 

hypothetical protein FLJ 12929 


t J A A 

71.00 


126433 


AA325606 




ft r™Ai^rAA^A^ a* 1 ll 11 1 ft ft 

gb:EST28707 Cerebellum Ii Homo sapiens c 


A A Art 

23.20 


126509 


f-H A « A A M 

R47400 


ft 1 A. A A A 

Hs.23850 


ESTs 


A A A rt 

23.80 


126538 


A r~l A A M M #• 

AB030656 


ft 1 A — v rt ^ ^ 

Hs. 17377 


coronin, actm-bindmg protein, 1C 


AA A A 

23.10 


126666 


A A M A ^% A. 

AA648886 


1 ft J « A A A 

Hs.151999 


ESTs 


rt rt A A 

36.00 


126812 


AB037860 


Hs.1 73933 


nuclear factor I/A 


A A A A 

20.80 


126872 


1 1 J > J A A M •* >^ 

AW450979 




ft ft ftf ft ft I-J. I A 1 A A rt ) 11 -J A 1 rt| i A p» O*. 

gb:U(-H-BI3-ala-a-12-0-Ul.s1 NCI_CGAP_Su 


4 A AA 

46.29 


127046 


A A A A J A J A 

AA321948 


ft 1 A A rt rt. rt rt 

Hs.293968 


ESTs 


A A Art 

22.80 


127431 


A % A f ^ ^» A A A A 

AW771958 


1 ft A f r" A A^ 

Hs.1 75437 


A- A. *A ■ • ft 1 | ^ > 11 ft Ak A A A M A» • 

ESTs, Moderately similar to PC4259 fern 


Art AA 

30.00 


A A — * J A A 

127489 


A A A A A ^ A 

AA650250 


1 < a— r rt rt"^rt 

Hs.272076 


fA A, A- 

ESTs 


AA A A 

20.80 


127521 


A t A 1 A A >tA A A 

AW297206 


11 J rt A rt j rt 

Hs. 16401 8 


ESTs 


Ar" rtrt 

25.20 


A— ■ ^ A A 

127742 


A 1 A tnriA A Art 

AW293496 


11 A A rt J rt A 

Hs.180138 


ft - Aj*A 

ESTs 


00 nn 

28.00 


4 A~t a a r* 

1 27925 


a a an t?4 f~4 

AA805151 


Ua aaaa 

Hs.3628 


mitogen-activated protein kinase kinase 


on on 
21.20 


A A A A 

127930 


A A AAA A*tA 

AA809672 


1 1— 4 AAA A A 

Hs.1 23304 


ESTs 


Art CA 

20.54 


127968 


A A A A AAA A 

AA830201 


1 1 _ A A A A J —* 

Hs. 124347 


f" ftA)T_ 

ESTs 


00 on 

28.20 


127987 


AI022103 


11 A rt A r" A A 

Hs.1 24511 


ESTs 


A A AA 

19.60 


128116 


1 fA"TJ A A 

H07103 


ft ft AArtA A A 

Hs.286014 


ti * i it i a Ar* a n a-7 a a a pit i i. 

Homo sapiens, clone IMAGE:3867243, mRNA 


Art A A 

20.40 


128609 


kill A rt rt rt ^ A 

NM_Q03616 


It A A A A ^rt 

Hs. 102456 


survival of motor neuron protein interac 


A A A A 

34.40 


128777 


a I rt *rr a a A a 

AI878918 


| 1 M AaAA 

Hs.1 0526 


cysteine and glycine-rich protein 2 


f— A A A 

53.80 


A A MM J A 

128949 


A A A rt A rt i — T 

AA009647 


1 1 AlA.b*A 

Hs.8850 


a disintegnn and metalloproteinase doma 


A A Art 

23.00 


129168 


All 32988 


Hs. 109052 


chromosome 14 open reading frame 2 


07 cn 
37,60 


129404 


AI267700 


Hs.317584 


ESTs 


28.60 


129527 


AA769221 


Hs.270847 


delta-tubulin 


40.80 


129574 


AA026815 


Hs.11463 


UMP-CMP kinase 


31.20 


129598 


N30436 


Hs.1 1556 


Homo sapiens cDNA FLJ12566 fis, clone NT 


29.60 


129785 


H19006 


Hs.1 84780 


ESTs 


72.20 


129970 


AV655806 


Hs.296198 


chromosome 12 open reading frame 4 


22.20 
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130149 


A ■ a ft Js. ^ai ^% *a* 

AW067805 


1 i A *Af A rt a r~ 

Hs.1 72665 


methylenetetrahydrofolate dehydrogenase 


29.60 


130199 


Z48579 


lb A »">AAAA 

Hs. 172028 


a disintegnn and metalloprotemase doma 


A-T A A 

27.60 


130441 


U63630 


Ik .at ^ A A A, T 

Hs. 155637 


protein kinase, DNA-activated, catalytic 


no OC 


130466 


W19744 


i 1 a A A A F— A 

Hs.1 80059 


Homo sapiens cDNA FLJ20653 fis, clone KA 


20.20 


A a a i r> 

130482 


A ■ A 1 J A A^ A J 

AW409701 


Hs.1578 


baculoviral IAP repeat-containing 5 (sur 


AO An 


J A A 4*\ A aa> 

130617 


a AAA. a* a A. 

M9Q516 


It ^ A ^ a 

Hs.1674 


glutamine-fructose-6-phosphatetransamin 


4 O CA 

iy,bu 


J AA.a>a#a.n. 

130703 


R77776 


Hs.18103 


ir+ 1—\ -r- 

ESTs ■ 


4n /a 
19.4U 


130732 


AW890487 


1 1_ A A A A 1 

Hs.63984 


cadhenn 13, H-cadnenn (neart) 


ti\ .4U 


130867 


NM_001072 


Hs. 284239 


UDP gIycosylU"ansferase 1 family, polype 


nu.uu 


131028 


it Ia^taw A*f" 

AI879165 


1 > AAA*7 

Hs.2227 


CCAAT/ennancer oinding protein (C/EBP), 


or on 

Zt).A) 


j a j jt\ a 

131086 


AL035461 


Hs.2281 


rtK-i it n lay n r-ift^ArnftA E J / A A A ^ A i A Al ■> A A 1 A 1\ 

cnromogranin d (secretogranin i) 


Aft fin 


j a a a a A 

131284 


tit i a a j i An 

NM_001429 


Hs.25272 


f™4 A L.!^.al!ft>.a> — .Oftft 

E1A binding protein p300 


^4.bU 


131775 


AB014548 


Hs.31921 


KIAA0648 protein 


zl.UU 


j /-\ u a a a 

131860 


BE383676 


Hs.334 


La a m ■ ■ « v« ■ v« ft>ai 1 ft^af a ailiiJ «a Ar^ A A A A f A A» A W I 

Kho guanine nucleotide excnange tactor ( 


JJ.4U 


131945 


Alma A AAAi A 

NM_002916 


It a r* a AA 

Hs.35120 


.1* At— £«ai.« i*S /aalltialaa A \ A /O"/ 

replication factor C (activator 1) 4 (37 


CA QA 


132040 


i ii ■ r\ s\ a a a a 

NM_001196 


Hs.315689 


Homo sapiens cuNA: rLJ z2o/o tis, clone n 


on ^n 

ZU.4U 


a a />rtn A 

132084 


AlA A AAAAl^ 

NM_002267 


1 1 AAAA 

Hs.3886 


karyopnenn alpha 3 (importin alpha 4) 


00 Af\ 


a a. a. a a A 

132389 


* a A A A AA A 

AA310393 


• ft A AAA j J 

Hs. 190044 


ESTs 


OO >1A 


132437 


AAA rA J /"} A 

AA152106 


Hs.4859 


cyclin L ania-6a 


07 >IA 

Z/.4U 


132550 


A 1 A fAi A A A r~ A 

AW969253 


Hs.170195 


bone morphogenetic protein 7 (osteogenic 


7c cn 


132617 


AF037335 


ft ft #— A AA 

Hs.5338 


carbonic anhydrase XII 


OH OC 
31 .00 


J y-w f-t A A, /-V 

132632 


AU076916 


Hs.5398 


guanine monphosphate synthetase 


00 >IA 

OZ.4U 


132672 


W27721 


Hs.54697 


Cdc42 guanine exchange factor (GEF) 9 


OO A{\ 


j o r\ -j A a 

132742 


a a nor j OA 

AA025480 


Hs.292812 


bSTs, weakly similar to i oo4oo nypotneti 


<?1 on 


132771 


Y 10275 


Hs. 56407 


phosphoserine phosphatase 


00 00. 


j a A A - 7 A 

133070 


t t a a a a rt 

U92649 


Hs.6431 1 


a _J j & J jL aft ^a a>b M rt i n n n l a| t a^ ft*% t b4 ^a ^a ^a jfH. Art 

a disintegnn and metalloprotemase coma 


oo Rn 


4 a a a f a 

133153 


AF070592 


Hs.66170 


HSKM-B protein 


on nn 


J A A i4 a- il 

133181 


\ff\A AAA 

X91662 


Hs.66744 


i-i • . I ~ i /PNa. An n n K if 1 i ii ii i j i 1 j-l i-ift / A A^yS A A A A A 1 A rt 

twist {Drosopniia; nomoiog {acrocepnaios 


oo fin 


133282 


M449015 


1 1 AAA 4 AC 

Hs.286145 


SRB7 (suppressor of RNA polymerase a, ye 


ci cn 


A f\ A A r— f~\ 

133350 


AI499220 


Hs.71573 


hypothetical protein FLJ 10074 


00 AA 


A a A ^ a a 

133592 


AV652066 


Hs.75113 


general transcription factor IIIA 


QO AA 

oz.UU 


133658 


ft 1 /\ J Hi j A 

AA319146 


|| — -» J A A 

Hs.75426 


secretogranin II (chromogranin C) 




133865 


AB011155 


ft ft A A A A A 

Hs. 170290 


discs, large (Drosophila) homolog 5 


69.33 


134032 


■ ft * _ [— \ *a A /"> ^ 

NM_005025 


1 t — t r\ t— a a 

Hs.78589 


serine (or cysteine) proteinase inhibito 


OO OA 


134125 


& ft a a j-K .ft Jft w A 

NM_014781 


Hs.50421 


KIAA0203 gene product 


oh en 

31 .oU 


134158 


U15174 


1 1 —t r"\ AAA 

Hs.79428 


BCL2/adenovirus E1B 19kD-interacting pro 


on ca 


134321 


BE538082 


Hs.8172 


T— A»f» »l J___l«al . b H . . 1_ A J A A J V It a 

ESTs, Moderately similar to A46010 X-lin 


oo An 


134367 


A A OOA A A fi 

AA339449 


Hs. 82285 


phosphoriDosyigiycinamioe Tormyitransier 


aq on 


134570 


U66615 


Hs. 172280 


SWI/SNF related, matrix associated, acti 


20.20 


134753 


NMJJ06482 


Hs.173135 


dual-specificity tyrosine-(Y)-phosphoryl 


20.80 


135002 


AA448542 


Hs.251677 


G antigen 7B 


37.60 


135029 


H58818 


Hs.1 87579 


hydroxysteroid (17-beta) dehydrogenase 


53.40 


135047 


AL134197 


Hs.93597 


cyclin-dependent kinase 5, regulatory su 


31.60 


135345 


X53655 


Hs.99171 


neurotrophin 3 


28.80 



TABLE 4B shows the accession numbers for those primekeys lacking UnigeneID's for Table 4A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland, California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



CAT number 



Accessions 



Pkey 

123619 371681 1 AA602964 AA609200 

126433 127143 1 AA325606 AA099517 N89423 

126872 1 42696 J AW450979 AA1 36653 AA1 36656 AW419381 AA984358 AA492073 BE1 68945 AA809054 AW238038 BE01 1212 BE011359 

BE01 1367 BE01 1 368 BE01 1 362 BE01 121 5 BE01 1365 BE01 1 363 

106851 322947 1 AI458623 AA639708 AA485409 R22065 AA485570 

118720 genbank>73515 N73515 

120515 genbank_AA258356 AA258356 

117099 321871 1 H93699 H97976 H80036 

101447 entrez_M21305 M21305 

123130 genbank_AA487200 AA487200 
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Table 5A shows 680 genes up-regulated In squamous cell carcinoma or adenocarcinoma lung tumors relative to normal lung and chronically diseased lung. These genes were 
selected from 59680 probesets on the Eos/Affymetrix Hu03 Genechip array. Gene expression data for each probeset obtained from this analysis was expressed as average 
intensity (AI), a normalized value reflecting the relative level of mRNA expression. 



Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 

R1: 70th percentile of AI for squamous cell carcinoma and adenocarcinoma lung tumor samples divided by the 90th percentile of AI for normal and chronically 

diseased lung samples. 

R2: 80th percentile of AI for adenocarcinoma lung tumor samples divided by the 90th percentile of AI for normal and chronically diseased lung samples. 

R3: 80th percentile of AI for squamous cell carcinoma lung tumor samples divided by the 90th percentile of AI for normal and chronically diseased lung samples. 

R4: 80th percentile of AI for adenocarcinoma lung tumor samples divided by the 80th percentile of AI for squamous cell carcinoma lung tumor samples. 

R5: 70th percentile of AI for squamous cell carcinoma and adenocarcinoma lung tumor samples minus the 15th percentile of AI for all normal lung, chronically 

diseased lung and tumor samples divided by 90th percentile of AI for normal and chronically diseased lung samples minus the 15th percentile of AI for all 

normal lung, chronically diseased lung and tumor samples 



Pkey 


ExAccn 


UnigenelD 


a ftftftftr? 

100035 






A ftftftft ft 

100036 






100037 


i 




100071 


A AOH AO 

A28102 




A f\f\A A A 

100114 


\/ftft ft ft ft 

X02308 


1 OAAAA 

Hs. 82962 


a ft ft A TT A 

100154 


i f a a~7 A A 

H60720 


Hs.81892 


J ftftA 0~7 

100187 


D17793 


U_ "7Q A 

Hs./oloo 


100188 


AW247090 


MS. 5/ 1U1 


100202 


BE294407 


HS.99910 


a aa A H a 

100216 


AA489908 


nS.1390 


100269 


NM_001949 


Un 4 4 on 

HS.1189 


100287 


A 1 f A*TAAC*7 

AL/076657 


Hs.1600 


A ft A A A"^ 

100297 


AU077258 


U_ j an a on 

Hs. 182429 


100330 


lit] J J ft ft ~7 ft 

AW410976 


Hs.77152 


100335 


AW247529 


Hs.6793 


100360 


l m l^ft A ~7 A 

W70171 


1 1 *7 f* A A A 

Hs.75939 


A ft ft ft ~y ft 

100372 


ttii ft A A-rftA 

NM_0 14791 


Hs. 184339 


100474 


tui ftftftftftft 

NM„000699 


1 1 ftftftftftft 

Hs.300280 


100486 


•T* A rt ft ft ft 

T19006 


i r _ a A A A A 

Hs.10842 


j} ft/t a ft a 

100491 


D56165 


I J ft~7^A A A 

Hs. 2751 63 


A ft ft r* A ft 

100516 


t*\ ft ftn*? ft 

D90278 


1 U il A\ 

Hs.11 


A ft ft r A a 

100522 


KM ^ A t~ ft A 

X51501 


1 1. AAA J A 

Hs.99949 


A ft f\ r~ r* tr\ 

100559 


k)ii ft ft ft ft ft A 

NM_000094 


kl. A ft A ft 

Hs.1640 


a ft ft ft 

100576 


\ //■% ftftt~ ft 

X00356 


Hs.37058 


A ft ft ft ft ft 

100629 


* a ftA r" ft ft ft 

AA015693 


It— ft A A A A 

Hs.21291 


A ft ft ft ft A 

100661 


BE623001 


1 r„ a A A~7 A O 

Hs. 132748 


A ft ft ft m T-1 

100677 


A A A*f AAflA 

AA353686 


11. 17-704 O 

Hs. 57813 


A A A A A A 

100696 


r\A inm 

D 14887 


Hs. 121686 


100709 


N26539 


Hs.1 00469 


A ft a -7 A A 

100761 


n i - irto Ar\4 

BE208491 


Hs.295112 


A ft ft ft ft ft 

100830 


A AAA A~f7f\ 

AC004770 


Hs.4756 


a ft ft n ft ^ 

100867 


U 14622 




a a a a a a 

100902 


1 MA A AAA 

M16029 


1 1 — AO"7A"7A 

Hs.287270 


A ft ft ft ft. ft 

100906 


A 1 1 A~ 7 A A A A 

AU076916 


Hs.5398 


A ft ft ft ft ft 

100960 


l ft ft A ft A 

J00124 


Hs. 117729 


A ft A ft A r** 

101045 


\ftr~ftA A 

J05614 




A ft A ft ft A 

101061 


ill i AAA 4 TC 

NM_000175 


Hs.180532 


A ft A ft~7 A 

101071, 


■ ft ft ft i r\ 

L02840 


\ \~ rj a ft A A 

Hs.84244 


A ft A 4 A jl 

101124 


L10343 


LJn 4 4 T3/H 

HS. 112341 


A ft A A *7r 

101175 


U82671 


A A A A A 

Hs. 36980 


A ft A A ft A 

101181 


t~ ft ft ft ft ft A 

BE262621 


l t« "7A*7nn 

Hs.73798 


101204 


L24203 


Hs.82237 


101210 


L29301 


Hs.2353 


101216 


AA284166 


Hs.84113 


101228 


AA333387 


Hs.82916 


101233 


AL135173 


Hs.878 


101273 


Z11933 


Hs.182505 


101342 


U52112 


Hs.182018 


101346 


AI738616 


Hs.77348 


101369 


NM_000892 


Hs.1901 


101396 


BE267931 


Hs.78996 


101431 


BE185289 


Hs.1076 


101448 


NM 000424 


Hs.195850 


101462 


AL035668 


Hs.73853 


101466 


BE262660 


Hs.170197 


101484 


AA053486 


Hs.20315 


101502 


M26958 




101505 


M307680 


Hs.75692 


101526 


NMJ)02197 


Hs.1 54721 


101535 


X57152 


Hs.99853 


101577 


M34353 


Hs.1 041 


101649 


AW959908 


Hs.1 690 


101663 


NMJJ03528 


Hs.2178 


101664 


AA436989 


Hs.121017 


101669 


L24498 


Hs.80409 



Unigene Title 

AFFX control: GAPDH 
AFFX control: GAPDH 
AFFX control: GAPDH 
Human GABAa receptor alpha-3 subunit 
thymidylate synthetase 
KIAA0101 gene product 
aldo-keto reductase family 1 , member C3 
minichromosome maintenance deficient (S. 
phosphofructokinase, platelet 
proteasome (prosome, macropain) subunit, 
E2F transcription factor 3 
chaperonin containing TCP1, subunit 5 (e 
protein disulfide isomerase-related prot 
minichromosome maintenance deficient (S. 
platelet-activating factor acetylhydrola 
uridine monophosphate kinase 
KIAA0175 gene product 
amylase, alpha 2A; pancreatic 
RAN, member RAS oncogene family 
non-metastatic cells 2, protein (NM23B) 
carcinoembryonic antigen-related cell ad 
prolactin-induced protein 
collagen, type VII, alpha 1 (epidermolys 
calcitonin/calcitonin-related polypeptid 
mitogen-activated protein kinase kinase 
Homo sapiens ribosomal protein L39 mRNA, 
zinc ribbon domain containing, 1 
general transcription factor IIA, 1 (37k 
myeloid/lymphoid or mixed-lineage leukem 
KIAA0618 gene product 
flap structure-specific endonuclease 1 
gb:Human transketolase-like protein gene 
ret proto-oncogene (multiple endocrine n 
guanine monphosphate synthetase 
keratin 14 (epidermolysis bullosa simple 
gb:Human proliferating cell nuclear anti 
glucose phosphate isomerase 
potassium voltage-gated channel, Shab-re 
protease inhibitor 3, skin-derived (SKAL 
melanoma antigen, family A, 2 
macrophage migration inhibitory factor ( 
ataxia-telangiectasia group D-associated 
opioid receptor, mu 1 
cyclin-dependent kinase inhibitor 3 (CDK 
chaperonin containing TCP1, subunit 6A ( 
sorbitol dehydrogenase 
POU domain, class 3, transcription facto 
interleukin-1 receptor-associated kinase 
hydroxyprostaglandin dehydrogenase 15-(N 
kallikrein B, plasma (Fletcher factor) 1 
proliferating cell nuclear antigen 
small proline-rich protein 1B (cornifin) 
keratin 5 (epidermolysis bullosa simplex 
bone morphogenetic protein 2 
glutamic-oxaloacetic transaminase 2, mit 
interferon-induced protein with tetratri 
gb:Human parathyroid hormone-related pro 
asparagine synthetase 
aconitase 1, soluble 
fibrillarin 
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TABLE 5B shows the accession numbers for those primekeys lacking unigenelD's for Table 5A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey 

117079 
124305 
101502 
109792 
126034 
102768 
126345 
127066 
127099 
119243 
125875 
112054 
126979 
126992 
122318 
114699 
114793 
108305 
108393 
100867 
123731 
109700 
120715 
113702 
115113 
101045 
108554 
108573 
119052 
126522 
126605 
103768 



CAT number Accessions 

1621717 J 
242183J 
18202.-6 
754958.1 
1598157J 
44641J 
1653833 1 
1703458 1 
244301.1 
1774795J 
1566433.1 
1538292J 
17141 1_1 
880655J 
29241 9_1 
135322.1 
150742J 
111550 1 
11341 1_1 
tigr_HT4586 
genbank_AA609839 
genbank_F09609 F09609 
genbank_AA292700 AA292700 
genbankj"97307 T97307 
genbankJ\A256460 AA256460 
entrez_J05614 J05614 
genbank_AA084948 
genbanMA086005 
149538.1 
416020.1 



H92325T97125 

AW963221 AA344870 M344871 H93331 
M26958 

R49625 F10674 
H60340N91637 
U82321 H66077 
N49713N49819W03810 
R25066 R20144 R20145 Z43845 
AA347668 AW956810 Z44271 F07065 F07064 R13506 
T12603T12604 
H14480 N98295 
R43590F10439 
M21 0954 AA21 1007 
A1809521 H12174242556 
M429743 AA442754 
AA1 27386 R1 5644 AA1 27404 
AA158245 AA1 58235 
AA071391 AA069892 AA069891 
AA075211 AA075245 AA075126AA074946 
U14622 

AA609839 



439280J 
46922J 



AA084948 
AA086005 
R10889 R10888 
W31912AI167491 
AA676910 AA778853 M778865 W86800 

W42667 AI580740 AI690440 AI561350 Am67906 AW151450 Af 825927 AL041 716 AI885600 AI742213 AW248624 AI955498 AA033947 
AA845593 AI62371 1 N68583 C00064 AA193567 AW083868 AW163216 M191595 AA522778 A1628008 AI915518 AA843508 AI926195 
AA176265 AW167963 AA9921 15 W93647 AW103572 AI862994 AI342059 AA91 1719 AA176155 AA024712 AA069988 AA205591 AI591 107 
A)199673A)811766AI275832A!422233A1191852AI096682AI580124AJ683612AA582453AA927559AA486415T32414AI084978 H44849 
H44848 H20477 T91 695 W47039 M070055 AA024795 AA328855 AA379248 M379330 M385580 W25920 W03688 AA448359 AA093881 
AW362477 AA089997 A1350265 W93479 N99688 M932257 AW351469 H68590 M663402 M069771 AW087986 AI858420 M600214 
AI970774 A1857712 AI683081 AI885584 AW131150 AI567981 AW002714AW1 89973 AW075495 AW168303 AA953714 AW516881 AI357375 
AI566663 AW51 2676 A1570580 AI023690 AA44821 6 AI079853 AI422707 M77951 6 AW026972 AW1 30082 AW1 62307 AW438646 AA709332 
AW192394 AI167350 AI217879 AI1291 52 AA719509 AI350480 AA66341 8 AI003634 AW1 1 8546 M1 80261 AA442833 AI268625 AA888881 
AI038759 AA846723 AI248770 AA993694 AI280335 AI885107 AW51 8649 M641 563 AA995835 AA582521 AI276744 AA436478 A1017360 
AI620763 A1859887 N73926 AI076327 AI741615 AI160617 AW1 72819 AI492005 M677429 AA996334 AI693771 AI950039 AI245629 AI288515 
AI8661 86 T93293 AA1 73262 AA599779 A1680092 AW43931 6 AI084555 AI272672 A1583507 AW47321 9 AA7381 32 AW473283 AI367492 
AA995410 AW89624 M206353 A1033095 AI040382 AA873630 AI221074 AI934840 AI418680 AA844306 R94503 AA773520 AA843169 
AA21 9425 AA629658 AI81 1 71 9 AW41 1 275 AI590981 W37907 AI591 178 AI684051 AA983238 AA669347 AA976239 M704570 AI628339 
AI884391 AI241580 A1003539 AW176687 AA009650 N34566 AI333493 AI186070 M070827 AA41 1683 AI280884 AA872023 AA207255 
AA021576 N71953 A1885888 AW076039 T15777 AI537673 AW248048 H09554 W93480 W47001 AW0791 14 AA063160 AA757453 R60788 
AI859431 H20478 AA218882 M757465 AA100995 AI864135 AI934209 AA070503 H47008 AA219646 W61039 W93907 AW385050 W37967 
W78028 M189007 M479136 R93650 M44231 2 T30287 AA847628 AA1 80262 AA009649 C03892 AW149464 AA310963 AA219693 
AA069747 R29207 AA094784 AA29361 5 AA447848 AI9841 67 N90393 C05097 N56499 AW292351 AW1 49681 AW473258 AA629322 AI004409 
AW105577 AI954937 AI81 1 070 AA902422 AW51 4437 AA535460AA91 6877 AW517122 AA974657 M975649 AW517130 AW517129 F31737 
W07688 AA193645 AA378994 M489273 F32267 W39303 AA021 181 N86810 M406524 AA062553 AA436801 H08985 H1 5979 N4031 0 
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AA436789 AA232172 AW360778 W25862 R60282 AA436530 AA378894 AA1 87461 AO40535 AA604210 AA0895U AA360421 N88243 N84281 
AA209340 N56174 N88374 AA191088 AW247691 AA249013 M0931 1 1 M972536 AW298594 AA375893 T12139 W28186 AW243849 
AI288629 AA843996 W15260 AH88286 AW248079 R15836 

1 1 9599 genbank_W45552 W45552 

112382 genbank_R59904 R59904 

105264 genbank_AA227934 AA227934 

100071 entrez_A28102 A28102 

123315 714071J M496369 M496646 



Table 6A shows 99 genes up-regulated in non-smokers with lung cancer relative to smokers with lung cancer. These genes were selected from 59680 probesets on the 
Eos/Affymetrix Hu03 Genechip array. Gene expression data for each probeset obtained from this analysis was expressed as average intensity (AI), a normalized value reflecting 
the relative level of mRNA expression. 



Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 

R1: average of AI for samples from non-smokers with adenocarcinoma divided by the 90th percentile of AI for samples from smokers with adenocarcinoma 

R2: average of AI for samples from non-smokers with squamous cell carcinoma divided by the 90th percentile of AI for samples from smokers with squamous cell 
carcinoma 
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TABLE 6B show the accession numbers for those primekeys lacking unigenelD's for Table 6A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey CAT number Accessions 

108562 36375 1 AA 1 00796 AF020589 M074629 M075946AA1 00849 AA085347 AA1 26309 AA0793 11 AA079323 AA085274 

103439 35330 J X98266N41124 

123551 genbank_AA608837 AA608837 

123861 genbank_AA620840 AA620840 

102832 entrez U92015 U92015 

101972 entrez_S82472 S82472 

121558 genbank_AA412497 AA412497 
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Table 7A shows 98 genes down-regulated in non-smokers with lung cancer relative to smokers with lung cancer. These genes were selected from 59680 probesets on the 
Eos/Affymetrix Hu03 Genechip array. Gene expression data for each probeset obtained from this analysis was expressed as average intensity (AI), a normalized value reflecting 
the relative level of mRNA expression. 



Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 

R1: 90th percentile of AI for samples from smokers with adenocarcinoma divided by the average of AI for samples from non-smokers with adenocarcinoma. 

R2: 90th percentile of AI for samples from smokers with squamous cell carcinoma divided by the average of AI for samples from non-smokers with squamous cell 
carcinoma. 
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TABLE 7B shows the accession numbers for those primekeys lacking unigenelD's for Table 7A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland, California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 

Pkey CAT number Accessions 

103207 30635_-4 X72790 

106566 120358J BE298210 AI672315 AW086489 BE298417 AA455921 AA902537 BE327124 R14963 AA085210 AW274273 AI333584 A1369742 AI039658 

AI885095 AI476470 AI287650 AI885299 AI985381 AW592624 AW3401 36 AI266556 AA456390 AI31 081 5 AA484951 

116571 genbank_D45652 D45652 

118466 genbank„N66741 N66741 

101046 entrez„K01160K01160 

101941 entrez_S77583 S77583 

103351 entrez_X8921 1 X89211 

123130 genbank_AA487200 AA487200 
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Table 8A shows 1720 genes either up or down-regulated in lung tumors or chronically diseased lung relative to a broad collection of over 40 distinct normal body tissues. 
Chronically diseased lung samples represent chronic non-malignant lung diseases such as fibrosis, emphysema, and bronchitis. These genes were selected from 39494 
probesets on the Eos/Affymetrix Hu02 Genechip array. Gene expression data for each probeset obtained from this analysis was expressed as average intensity (AI), a 
normalized value reflecting the relative level of mRNA expression. 

Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 

R1: 70th percentile of AI for lung tumors divided by 90th percentile of AI for normal lung 

R2: 70th percentile of AI for chronically diseased lung divided by 90th percentile of AI for normal lung 
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TABLE 8B shows the accession numbers for those Pkeys in Table 8A lacking unigenelD's. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 



322044 


187363.1 


AW340926 M249063 N86075 


322060 


44320 1 


AI341937 AW003063 U34725 AA904742 


321430 


42705 1 


X5741 4 X5741 5 


321467 


43034 1 


X1 3075X1 3076 


322125 


46779 1 


R93901 AF075073 R93902 


322166 


46861 1 


H69434AF085958H69846 


322173 


46873.1 


H52567 H52557 AF085970 H52164 


322178 


46882.1 


H56535AF085980H56712 


322179 


46885 1 


H92891 AF085982 H92777 


321577 


1615102 1 


H84849 H84252 H84260 H86664 H85320 


321587 


1615333 1 


H95531 H95521 H84529 


313723 


111953 1 


AA07041 2 M1 02346 AA081 885 


320997 


627492.1 


H22544H46842AI204929 


322278 


47271.1 


W69304AF086283 W69200 


321687 


218439 1 


AA625149 AA313030 AA313052 H97463 


313883 


129439 1 


AA665089 AA1 351 30 AA484059 M1 0241 9 AW877765 


322320 


47422J 


W79150AF086419 


322339 


814584J 


AI668646 A1734214 W17348 


3U648 


293660 1 


AW979268 M878419 AA431342 AA431628 


300201 


682222 1 


AI308300 AI308296 


306897 


25196_-2 


AI093967 


323155 


979809 1 


AL1 20701 AL1 35041 AL121524 


322527 


38927 1 


AF147359T58511T58560 


322585 


473768 2 


W88919W89125 


300362 


1574395 1 


242308 H23514 


322635 


82296 1 


AA005129 AA679084 AA694399 


322664 


85042.1 


AA011522 AA702841 M011691 AA330797 


315454 


380580 1 


A1239464 AI239473 AA625812 AI208703 


322687 


37372 1 


AF074666 All 10759 AF090902 


314852 


327472 1 


AI903735 AA491283 AI694953 AW976903 AA761362 


307783 


697809 1 


AI347274AW844024 


324072 


269032.1 


AA381722 AA381829 AW963906 AW963902 M381242 


300627 


221345J 


AA488472 W27363 AA317053 BE082689 AW967036 BE079872 


323505 


196389 1 


AW970512 AA280251 AI652287 BE466438 Al 650725 AA551 854 AA28 1574 AW57 1481 


315791 


403558 1 


AA678177 AA677034 


324303 


233842 1 


AL118754 M333202 H38001 


316519 


442885 1 


AA847835M768376 


300926 


333127.1 


AA504860 M504911 



Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 
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TABLE 8C shows the genomic position for those Pkeys in Table 8A lacking unigene ID's and accession numbers. For each predicted exon, we have listed (he genomic 
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 

Pkey: Unique number corresponding to an Eos probeset 

Ref: Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA 

sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495. 
Strand: Indicates DNA strand from which exons were predicted. 

Nt_position: Indicates nucleotide positions of predicted exons. 
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Plus 


7695440-7695697 
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1. et.al. 


Plus 


7696625-7696707 


333772 
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ml ml 

. etal. 
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7706773-7706902 


333777 


Dunham, 


ml ml 

. et.al. 


Plus 


*7~r A cane TTAcnAd 

7746805-7746916 


1*3*1Q AC 

333846 
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1 mi ml 

1. et.al. 


Plus 


oftnocio annate? 

8008623-8008757 


333884 


Dunham, 


ml ml 

. etal. 


Dll.m 
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000007 
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. etal. 
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8154882-8155025 
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mi mt 

. et.al. 


Plus 
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. et.al. 
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nl,.. 
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. et.al. 
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G.CC34QC CCCIOOC 
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333966 
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. etal. 


Dll lm 
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ml ml 

. etal. 


Dl.im 
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8681004-8681241 


334061 


Dunham, 


mi ml 

. et.al. 


Dl.im 

Plus 


968b941 -9b87077 


OO /lAf) /I 

334094 


Dunham, 


ml ml 

. etal. 


Dl.im 

Plus 
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334113 
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. etal. 


Dl.im 
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. et.al. 
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20078117-20077991 



WO 02/086443 






334945 


Dunham 

UUI Jl 101 1 lj 


i et a! 

!■ Cl.dl. 


Mintic 
iviii iuo 


201 18885-201 1RR17 


334967 


Dunham 


I etal 

i. ci.di. 


Mimic 

IVIIIIUO 


2017331 1-2017121R 

•CU 1 1 OO 1 I'tCU 1 1 <J£. 1 O 


334990 

W W * J £J W 


Dunham 


1 pt al 

J. ci,di> 


Minuc 
lyjjiiuD 


90341 159-90141 0R7 


335091 


Dunham 

UUI II Idl 1 1| 


1 pt al 

la CL.Cll. 


Mini le 

IVIIIIUO 


91 9Q7367-91 9Q791 4 

C 1 l UU f £. 1 C.V / A It 


335988 


Dunham 

UUillldlll, 


1 at al 

1. Cl.dl. 


Minuc 

IVIIIIUO 


99304975-99101770 


335789 


Dunham 

UUI 11 Idl 1 1, 


( pf a! 

ii ci.di. 


Mini ic 

IVIII IUO 


22in5Q5n-92in57nfl 


11554R 


Dunham 
uui main, 


1 pt a) 

1. cl.dl. 


Minuc 
IVIIIIUO 


94669771-94RR9R71 

LtQO£l 1 O-<lH00«tO/ O 


335551 


Dunham 

UUI II Idl 1 1| 


1 pt al 

1. ci.di. 


Minuc 

IVIIIIUO 


9467QR9R-94R7RQR1 

£,*tU/ outO-^lHDf 03U 1 


335619 


Dunham 

uui ll idl 1 1, 


1 pt al 


Minuc 

IVIII IUO 


950R9677-950R949R 


335620 


Dunham 

uui ii iai i if 


1 Ptal 


Minuc 

IVIIIIUO 


95099561 -95099414 


335621 


Dunham 


1 eta! 

It wl«G*p 


Minuc 

IVIlI luO 


95098878-95098767 

aCUUC7UUr u tCwuJOi U( 


335682 


Dunham 

UUI II ICll 1 I, 


i et al 

1* CliUli 


Minuc 

IVIII 1 no 


95491 91 5-95491 091 


335755 

WWW* WW 


Dunham 

uui ii icii i if 


1 etal 

I* wl*GH» 


Minuc 

IVIII 1 uo 


25763806-95761747 


335814 

WW WW J *T 


Dunham 

UUUU ul 1 1 p 


1 etal 


Minuc 

Ivll 1 IUO 


26390043-2631 9845 

LUut^UUtJ i.UU 1 ou*tu 


335815 


Dunham 

L/UI II lull 1 1 


1 etal 


Minns 

IVIII IUO 


26320518-96390491 

LUU£VU lU'LUuLUtl. 1 


335835 

W W vU W V 


Dunham 

UUI II lul 1 l| 


1 etat 


Minus 

IVIII IUO 


26393311-26393245 

■C.WWWWW J rLUOiyjLnJ 


335851 

WW W W W J 


Dunham 

uui ii iai 1 1| 


1 et al 


Minuc 

IVIII IUO 


26604863-26604742 


335868 


Dunham 


1 pt al 


Minuc 


2671 1 417-2671 1 100 

iU/ J J*tU/ £.\JI 1 IUL/U 


335896 

www W w W 


Dunham 

UUI 11 ICll 1 1| 


1 pt al 

1. Cl.dl. 


Mini ic 

IVIIIIUO 


26977819-26Q77558 

c.\J<Jl 1 003 cXjdi iuuO 


335938 


Dunham 
uui ii iai 1 1, 


! at al 
ii oiidii 


Mini ic 

IVIIIIUO 


27160474-271R0400 


335948 


Dunham 

UUI II Idlll, 


1 pfal 
ii ci.di. 


Mint ic 

IVIII IUO 


27555Q24-275557R8 

£.1 vJJJjl.'ri.l uuuf OO 


336066 


Dunham 

UUI 11 lal 1 1, 


1 Pt al 

Ii Cl.dl. 


Mint ic 

IVIII IUO 


29241 080-29940849 


336906 

UUU4.UU 


Dunham 
uui ii icii ii, 


1 pt al 

I. Cl.dl. 


Mint ic 

IVIIIIUO 


10477456-1047711 1 

uui/ 1 Huu-UU'rf /Oil 


336975 

JJWL 1 W 


Dunham 

uui ll iai 1 1, 


1 pt al 
i> ci.di. 


Mfn 1 1 c 

IVIIIIUO 


190RR675-19nfl6516 


336292 


Dunham 

U Ul 1 1 1 QJ 1 1 1 


1 pt al 

i> ci.di. 


Minuc 
iviii iuo 


1981 R015-19R1 7997 


336331 

WW Www 1 


Dunham 

UUl II ICII 1 1; 


1 etal 

I* CLiuU 


Mini ic 

IVIII IUO 


11594597-11594171 


336419 

WWW*T 1 W 


Dunham 

UU 1 II 1 GH 1 1 , 


1 etat 

. ci.di. 


Minuc 

IVIII IUO 


34059568-14069445 

U*t UU .CU U O" U t UU it HU 


336675 


Dunham 

UUl II ICII 1 lp 


I etal 

II Cl.Oli 


Minuc 

IVIII IUO 


2020758-2020664 


336684 

WWWU U~ 


Dunham 

UUI 11 Idl 1 lp 


I et al 


Minuc 

IVIII IUO 


2158060-2157991 

£- 1 UUUUU 4. 1 Uf uuJ 


336716 

vvw/ 1 W 


Dunham 

L'UI II lul 1 lj 


I etal 


Minuc 

IVIII IUO 


3259952-3259R62 


336798 


Dunham 

UUI II lul 1 1, 


1 etal 


Minuc 

IVIII IUO 


5888954-5888757 


337043 


Dunham 

L'UI I1IOI lip 


1 et al 


Minuc 

IVIII IUO 


1 7407110-1 7407251 

1 » *tUl UUU" i 1 *tUI C.*J 1 


337046 

WW * U*tU 


Dunham 

UUl II Idl II, 


1 pt a] 

. ci.di. 


Minuc 

IVIII IUO 


17610892-17610821 

llul UUv7*v IIUI UUt 1 


337128 

OvJl 1 £U 


Dunham 

L/UJ II IOI II, 


pt a! 


Mimic 

IVIIIIUO 


22216951-9991 5014 

CCt- \ U«CU 1 CC C \ UUUt 


337192 

UUf 1 3t 


Dunham 

uu 1 1 1 iai i i, 


pt al 
. ci.dii 


Minuc 

IVIIIIUO 


9469 1 851-94591 771 


3371 94 

UU 1 1 O^T 


Di mham 
uut it iai i i t 


I pt a) 


Minuc 

1 Will IUO 


^4610510-94610159 

£.*1 U ( UU 1 U-t**U 1 UUUU 


337929 


Di mham 
uui mam, 


pt al 


Mini ic 
IVIII IUo 


9671 6579-9671 R4R1 

£SJI IU9r v7*t>Ui 1 OHO 1 


117195 

UU 1 U£U 


Dunham 
UUIIildl II, 


pt al 
. cl.dl. 


Mintic 

IVIII IUO 


1001 5Q4R-10M 5flnn 

UUU 1 UoHO-uUu 1 UOUU 


337497 


Dunham 

UUillldlll, 


at at 


Minuc 

IVIII IUO 


11171 117-1117195H 
uuu/ lulr-uuu/ iioo 


337500 

UU f 9UU 


Dunham 
UUI II Idl 1 1, 


pt al 
. ci.di. 


Mini ic 

IVIII 1UO 


1117R91 9-111761 5R 
uuur \j£. I c.- o jo / u 1 00 


337603 

UUf UUu 


Di mham 
uui ii iai u, 


pt al 

■ ci.di. 


Minuc 

IVIII IUo 


199999R-1999194 

I l33£90* I f-ZtZf 1 o*r 


337605 

UU I UUJ 


Dunham 
uui ii idi ii, 


et al 

, Cl.dl. 


Mini ic 

IVIIIIUO 


114R555-1 146197 


337671 


Dunham 

uui ii iai i i, 


pt al 


Mintic 


1960614-1960547 


337786 

WW 1 1 WW 


Dunham 

UUI II ICII 1 1, 


pt al 

. Cl.dl. 


Minuc 
iviii iuo 


41 11901-41 110R1 

*t 1 OUfcUu-*T 1 UOUO 1 


337862 

WW t UUl 


Dunham 

UUI 11 IOI 1 1, 


et al 


Minuc 

IVIII IUO 


5147668-5147660 

UU*tf uuu-uut/ UUU 


338083 


Dunham 

UUI fl ICt 1 t t 


et al 


Minuc 

fvilf IUO 


9318438-9318101 

ww I wTv(rvw I www i 


338158 

uwu I wW 


Dunham 

UUI 11 lul 1 lj 


et al 


Minus 

iviiiiuo 


11794465-11794143 

iii aftuu" 11/ utjtu 


338161 

WWW 1 W 1 


Dunham 

UUI II 1 CU 1 1, 


et al 


Minuc 

IVIII IUO 


12124716-12124658 


338182 


Dunham 1 

UUI II 1 Mil 1 , 1 


pt at 

• CLidl* 


Minuc 

IVIII IUO 


12824919-12824897 

l&ULti/ 1 U 1 £U£1l)£l 


338189 


Dunham 1 

UUillldlll, 1 


pt al 


Minuc 

IVIII IUO 


1 9878594-1 9R78478 


338199 

WWW 1 WW 


Dunham 1 

UUlllldlllf l 


pt a! 


Minuc 

IVIII IUO 


1 1760865-1 1760780 

IUf UUOUu- 1 U / ou/ ou 


338915 

www/. 1 U 


Dunham 1 
UUillldlll, 1 


et al 

i cl.dl. 


Mini ic 

IVIII IUO 


14056447-1 4055156 

CtuJUTt/ 1 HUUUUUU 


338469 


Dunham 1 

uuiiiidiii, i 


et al 

. ci.di. 


Minuc 
mil IUo 


90590187-90 590949 


338549 

wwWwHw 


Dunham 1 

UUillldlll! 1 


pf al 
. ci.di. 


Minuc 

IVIIIIUO 


92049 1 7 1 -2 904Q08 1 


338561 

wwUwU f 


Dunham 1 

UUillldlll, 1 


pt al 

■ Cl.dl. 


Minuc 

IVIII IUO 


2211 1966-9911 1856 

££u 1 t OUU ttO 1 IOUU 


338671 


Dunham 1 

UUillldlll, 1 


et al 

. Cl.dl. 


Minuc 

IVIII IUO 


9460R49 1-94508146 

tHJUOtfe 1 -fcHUUU JtU 


338676 


Dunham 1 

UUillldlll, l 


pt al 

• Cl.dl. 


Mini ic 

IVIIIIUO 


94617497-94617169 


338726 

wwWf 


Dunham 1 

UUI ll ICII II, 1 


pt al 

. Cl.dl. 


Mini ic 

IVIII IUO 


96996906-95^9561 8 


338779 

wwUI 1 O 


Dunham 1 
uuiiiidiii, i 


pt al 

. ci.di. 


Mini ic 

IVIII IUO 


97010161-97099796 

c.1 UuU 1 0 \-£.l U£9f uu 


338871 


Dunham 1 

UUillldlll, 1 


pt al 

. Cl.dl. 


Mini ic 

IVIIIIUO 


98101 70R-98101 611 

tOOU 1 / UO-C.QUU lull 


338872 


Dunham ) 

UUl It let ft, 1 


pt al 

t wl«Cflt 


Mmus 


28300921-28300790 


338966 

www wUU 


Dunham 1 

uui ii igi 1 1, i 


pt al 
. ci.di. 


Minus 


29614876-29614749 


339229 


Dunham 1 

UUillldlll, 1 


pt al 
. ci.di. 


Minus 


32722330-32722199 


339264 


Dunham 1 

UUillldlll, 1 


pt al 
, ci.di. 


Minus 


32975145-32975053 


325998 


6381940 


PI IK 


2630-2694 




325935 


6381943 


Mimic 


162154-162264 


3995RR 


3962484 


r iuo 


1169-1619 




399560 


3962491 


Pine 
r IUo 


2095-2990 




399541 


3983503 


Mini ic 


2765-3059 




395398 


5R66875 

UUUUU f u 


r Iuo 


86780-86854 




395340 


6017033 

UU 1 I uuo 


Mini tc 

IVllllUb 


166656-166819 


395373 


5866920 


Mini ic 

will |Ub 


1136686-1136777 


195167 


5866920 


Mini ic 


922881-922958 


325389 

U£.<JUUO 


5866921 

UUUU34 1 


r IUo 


239672-239759 


395436 


5866939 


Mini ic 
IVIII lUb 


29778-29907 




325498 


5866967 


Pine 


173372-173930 


325471 


6017034 

\J\J 1 t ww*t 


Mini ic 

IVIII IUO 


289268-289342 


325557 

w£»www r 


6056302 

w ww w w 


Pltlc 

1 IUO 


50921-51050 




325559 

Wi. WW WW 


6249595 

\J£tTf W W WW 


KMint ic 
iviii lu a 


118590-119172 


325560 


6249595 


Minus 


133794-133981 


325569 


6249599 


Plus 


79927-80217 




325587 


6682462 


Plus 


126724-126967 


325585 


6682462 


Plus 


73476-73574 




325597 


5866992 


Plus 


1065020-1065089 


325639 


5867002 


Plus 


253525-253608 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



WO 02/086443 




325739 

\JL-\Ji UU 


5867038 

OUU 1 www 


Minus 

IVll 1 lUw 


205138-205269 

C\J w 1 WU £.ww*_ ww 


325740 

\J£-\) 1 "TU 


5867038 

www/ www 


Minus 

IVll 1 JUw 


207533-207690 

Km\J t WWW £~\Jt WWW 


325792 

WLW 1 W*» 


6469828 


Minus 

1 V IN IUO 


1018-1176 

1 U 1 U 1 1 1 u 


325735 

vLv J WW 


6552447 

w W u £, T 1 1 


Minus 

|YI It 1 WW 


269122-269190 

fwWW 1 (— *— i—\J\J I WW 


325685 


6682468 

W W U£_~ W W 


Plus 

1 lUw 


117397-117483 

1 IIWW' 1 1 * i WW 


325686 


6682468 

WWW L"U W 


Plus 


118337-118439 

I 1 WWW 1 1 1 W I w w 


325819 


6682490 


Minus 

|V 111 IUJ 


130314-130370 

1 UUU 1 1 WWW 1 w 


329764 


6048195 

W W ~W 1 WW 


Minus 

IV 1 II IUJ 


109733-109968 

1 WW C WW iwwwww 


329703 

U(.v 1 UU 


6065793 

WW WW I WW 


Minus 

IVll 1 lUu 


139994-140138 

1 U w v v 1 TV IUU 


329643 


6448539 

W »~WW Ww 


Plus 


53403-53537 

W W I w w w w w w * 


329816 

U£»wU 1 U 


6624888 

UUfk*tUUU 


Minus 

\ Vlil IUJ 


70296-70423 

t WftkWW 1 w~»»u 


329860 

^/.wU U w 


6687260 

www/ AUU 


Minus 


163474-163605 

I WW «/ * i wwwww 


325883 


5867087 

Www 1 UU 1 


Plus 

1 1 U O 


22498-22663 

<_ t—\ WW ft- w w u 


325895 


5867097 


Plus 


358317-358476 

W W W W « 1 UUU i 1 u 


325925 


5867124 

WWW/ 1 


Plus 

1 IUO 


115749-115962 

1 IUI ~v 1 IWWW** 


325932 

Otv Jut. 


5867127 

uuu r i *s»i 


Plus 

1 IUJ 


7369-7441 

t www ■ « r i 


325941 


5867133 

WWW/ 1 WW 


Minus 

IVIII IUJ 


64228-64402 


325969 


5867153 

WWW / I WW 


Plus 

1 JUJ 


101911-102081 

IV / *r f 1 1 vi< W W 1 


325971 

U^W W 1 1 


5867153 

WW W r 1 WW 


Plus 

1 IUJ 


105841-106035 

1 w W W I 1 | W W W WW 


329993 

U^ww WW 


4567166 

"ww 1 1 ww 


Minus 

IVll* IUJ 


101307-101434 

1 W 1 WW 1 1 W 1 » w * 


330020 


6671887 

WW J I WW ■ 


Plus 

1 IUJ 


172397-172491 

I I 4- WW f || fcTtf 1 


326163 

W 4— W 1 W W 


5867168 

WW W 1 1 WW 


Minus 

IVIII IUW 


7831-8035 

■ WW 1 wwww 


326274 


5867171 

UUUl III 


Minus 

IVIII IUJ 


410289-410404 

I 1 w^ww ~ 1 w »^ w • 


326025 


5867176 

www t i « w 


Plus 


70854-70915 

/ W WW 4 f ww < w 


326046 

W t»U V t V 


5867182 

WWW/ 1 w*- 


Minus 


62668-62825 

WbWWW w«*Wpi»W 


326099 


5867186 

WUvl 1 UU 


Minus 

1 V 1 1 * IUJ 


661381-661510 

WWIWW4 WW! W 1 W 


326108 

I vu 


5867187 

WWW f IUI 


Minus 

IVll 1 IUJ 


23784-23903 

J^W 1 W i ^wwww 


326165 

V^V J UU 


5867208 

w V W / AiUU 


Minus 

9YH9 IUJ 


62787-62929 


326189 

Jlv 1 UU 


5867212 

www/ £. 1 £- 


Plus 

1 IUJ 


69288-69413 

WWfcWW WW~ 1 w 


326204 

W/-rU^U*T 


5867218 


Minus 

IVIII IUJ 


148088-148200 

l~WUWW | iwLUV 


326230 


5867230 

Www f £. w w 


Minus 

IVIII IUJ 


301868-301972 

WW 1 WWW WW Ivl 4> 


330052 


4567182 

*touf lot 


Plus 

1 IUO 


352560-352963 

U W*-W w W W WX> W WW 


330036 


6042048 


Pins 


117120-117216 

1 1 f 1 »- V 1 | 1 falV 


326360 


5867293 

UUUY fcWU 


Plus 

1 IUJ 


13627-13844 

1 vUt / ' WU77 


326589 


5867320 

WWW 1 ULU 


Plus 

1 IUJ 


22760-22919 

A—i— l WW *-t-W 1 w 


326393 


5867341 

WWW 1 W*T | 


Plus 

J IUJ 


41702-41841 

T 1 1 Wfc * 1 W » 1 


326505 


5867435 

UUU/ twu 


Minus 

IVIII IUJ 


8818-8949 

UU 1 W UWTw 


326515 


5867439 


Plus 

1 IUJ 


36683-36809 

wwwww wwwww 


326592 


6138928 


Plus 

1 IUJ 


23689-23828 

^wwww ^ w w** w 


330107 


6015249 

WW lUfiW 


Minus 


100091-100282 

• www w i luytv*. 


330106 


6015249 

UU 1 J<u"C 


Minus 

IVIII IUO 


99443-99778 

WW ■ * W WW 1 f w 


330100 


6015253 

ww | U<- ww 


Pius 

1 IUJ 


21166-21301 

t— 1 IWW i— 1 W W 1 


330093 

w w w V w w 


6015278 


Plus 

1 IUJ 


1043-1199 

1 U~W 1 * ww 


330088 


6015293 

WW I wi. WW 


Plus 

i IUJ 


37517-37638 

Uf U 1 1 W f www 


330085 


6015302 


Minus 

IVIII IUO 


5961 3-59770 

UUU 1 U UU f r w 


330120 


6671864 

WW 1 J ww*f 


Minns 


127553-127656 

I f WWW ( t* # WWW 


330123 


6671869 

UU # J Uww 


Minus 

IVIII IUO 


3531 1-35406 

UUU I 1 uu » vu 


326742 


5867611 

w w U / w 1 1 


Minim 

IVIII IUO 


95187-95248 

WW 1 W f w w** ♦ w 


326605 


5867637 


Plus 

1 IUJ 


24656-24749 


326818 


6117831 

Will Ww f 


Minus 

trill (Uy 


15199-15309 

» W 1 ww • WWW w 


326720 

u«-v f tv 


6552456 

wUUX»"Uw 


Plus 

1 IUJ 


84525-84677 

U *UtU W"W 1 1 


326770 


6598307 

UU wUvV/ i 


Minns 

IVIII IUO 


513603-513668 

U 1 Uw vu u I u w w w 


326692 

Wju W wi- 


6682502 

UUUAUU4 


Plus 

1 JU J 


117697-117899 

1 1 J WW J III www 


326693 

U£«U U w U 


6682502 

W U wLwUfH 


Minns 

IVJII IUJ 


335002-335095 

wwwww*— wwwwww 


326983 

W<- WW U O 


5867657 

WWW f W W 1 


Minus 

IVIII IUO 


16023-16581 

1 WV&aW \ WWW 1 


326991 

W^k. www 1 


5867660 

WW w f www 


Plus 


18147-18339 

»W I I / * wwww 


326936 

U £»U w U v* 


6004446 

WW WIT [U 


Minus 

1 VHI IUJ 


10217-10357 

1 W mm II I WWW 1 


326964 


6469836 

U~U UUUU 


Pius 

1 IUJ 


75340-75456 

1 ww~w # w » w w 


327040 

# w^U 


6531965 

U W W 1 uuu 


Plus 

J IUO 


783670-783817 

/ WWW/ W / WWW * 9 


327053 


6531965 

WuU | wUU 


Plus 

1 IUJ 


2247267-2247437 


327075 


6531965 

www I w w w 


Plus 

1 IUJ 


4041318-4041431 

l W ■ 1 W 1 w ~W~ i » W 1 


327085 

\J t— 1 UUU 


6531965 

www 1 wUU 


Plus 

f IUJ 


4734947-4735069 

~9 W * W 1 I ^» 1 wwwww 


327036 


6531965 

UJO 1 www 


Plus 

1 lUw 


319951-320040 

W 1 www » u*»vw~w 


327130 


6531976 

WWW 1 W ff W 


Plus 

\ IUO 


20247-22343 


327156 


5866841 


Minn ^ 


2462-2620 


327288 

W*- f LUU 


5867481 

w U w ' ■ U 1 


Plus 

1 IUO 


48583-48773 

"TUWUU tU 1 / u 


327332 

wi- 1 WW'- 


5867516 

WWW f U 1 u 


Minus 

IVll 1 IUO 


56361-56532 

WWWW 1 w w w w 


327220 


5867525 

WWW* W i- W 


M/nus 

IVIII IUO 


65701-65781 

WU i W 1 VU IUI 


327224 


5867534 

WWW/ W V J 


Plus 

1 IUO 


188468-188544 

i w w # w w i www~ r 


327321 

W4- i W*» 1 


6249562 

W*-~ w w w *- 


Minus 

IVIII IUJ 


99745-99836 

WW 1 i w wwwww 


327361 

w t- r W W ■ 


6552412 


Minus 

IV III IUJ 


61013-62130 

W 1 V 1 W W4L. 1 WW 


327396 

UJ*/ Uww 


5867743 

WWUf 1 lU 


Plus 

1 IUJ 


8702-8820 

WJ Wi» WW£_W 


327414 

Wi. 1™ 1™ 


5867750 

uuu i i ww 


Plus 

1 IUJ 


102461-102586 

1 w t» ' W 1 | w w w w 


327442 


5867759 

www/ f ww 


Plus 

1 IUO 


111483-111618 

III ~WW | 1 1 W 1 w 


327467 

W«p f ^ w / 


5867772 

UUU/ iff- 


Plus 


88030-88151 

WWWWW WW f W 1 


327473 

w£> l"l V 


5867775 

UUU ' ( (U 


Plus 

1 IUO 


75101-75181 

1 W 1 W 1 f w ■ W 1 


327483 


5867783 


Plus 


181573-181662 

1 U 1 Uf U IUI V w*» 


327377 

U t. luff 


5867793 


Mimic 

IVillfUO 


37610-37676 

UIUIU V 1 u / u 


32756? 

Otf Out 


UUU 1 out 


Mini id 


343989-344474 

U~UwUU U 1 I I 1 < 


327568 


5867811 


Minus 


46152-46287 

" v 1 U£» iwlUI 


327606 


6004463 


Plus 


200262-200495 


327611 


5867868 


Minus 


175063-175392 


327642 


5867891 


Minus 


2513-2743 


327654 


5867910 


Minus 


97564-97710 


327734 


5867940 


Minus 


31003-31583 



PCT/US02/12476 



150 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



WO 02/086443 




Q0777C 


bob/ yb4 


Pi h i n i i o 

Minus 


130791-130871 


32/ /9b 


obb^yoz 


Dine- 

rlUS 


85267-85405 


327840 


b249b/o 


Minus 


73065-73206 


330208 


buiobyy 


rtUS 


66517-66931 


ooUzbo 


bb/1oo4 


Minus 


101503-101634 


328U04 


bob/ yyj 


ft ill nt l 

Minus 


157407-157887 


3281 Ul 


cocanon 


rlUS 


289920-290014 


oZo lUU 


boboUA) 


Minus 


263545-263635 


ozollo 


bobbUZ4 


Minus 


80378-80491 


OOQI C7 


ooboUb4 


Pine 

rlUS 


73326-73615 




OODduOU 


minus 


16551-16729 


'30Q1Q7 


OuaOUu 1 


ft 4ijn 1 1 r- 

iviinus 


42133-42438 


Q07CMft 

oz/y4U 


CQCQ-t Q7 

boboiy/ 


ft Aim if 

Minus 


95240-95428 




OODOZ lb 


rlUS 


66611-66677 




byuz4oz 


Pine 
rlUS 


713478-714590 


32o0bo 


bl 1 /alb 


Dine 
rlUS 


253903-254022 


3282b4 


cam qio 


Pine 

rlUS 


55086-55404 


330300 


2yUbob2 


ft M IM ft 

Minus 


3246-3302 


328608 


58b8222 


Minus 


87770-87953 


328600 


5ob8229 


Minus 


38889-40010 


328610 


cocooon 
oobozoy 


DIi ip 

rlUS 


293920-294224 

<_ v i^_w ii**« • 


328623 


586824b 


Minus 


120020-120126 


OOOC30 

328b32 


bobo24/ 


rlUS 


76734-76853 


328bbb 


bbbbzb4 


ft jll r\t I ^ 

Minus 


778-901 


QOQCOQ 

oZobyo 


boboZb4 


ft A Ml 1 O 

Minus 


625555-625633 


3207UU 


ooboZb4 


Dlt ic 

rlUS 


764089-764203 


OOQ7fiQ 

OZO/Uo 


bobo^/i 


ft Jim iip 

Minus 


68114-68854 


dZo/ob 


OuDOtOy 


DIi ip 
rlUS 


89389-89455 


328/4.5 


oobo^ob 


Pine 
rlUS 


274638-274726 


o^ooUb 


bobooZn 


Pine 
rlUS 


29408-29684 




EQCQOCC 

ODDOJUD 


ft A i 1 1 1* 

Minus 


149708-149889 


328342 


boboobo 


DIi ip 

rlUS 


59955-60094 


3283bb 


bobo3o/ 


Minus 


270724-270798 


■5OQ0CO 

3283by 


bbboooo 


Dl i in 

rlus 


75371-75583 


328381 


bobo392 


Dim- 

rlUS 


662758-662848 


328451 


58b842b 


Minus 


217275-217336 


O^tO AO ■i 

328481 


COCOA ACl 

58bo449 


Minus 


8987-9180 

V^WWJ W t W w 


328500 


COCQ ACA 

58bo4b4 


rlUS 


59098-59481 


328530 


5obo4oi 


PL ip 

rlUS 


334973-335406 


32obb4 


bUU44/ J 


DL ip 

rlUS 


1193739-1193866 


QQQQC4 


booiy^o 


ft Jltn 1 h o 

Minus 


108317-108403 


328908 


bbbo4yo 


rlUS 


117002-117059 




OoutSbUU 


PI IIC 

rlUS 


771755-771889 


QOQQQvl 

OZoyo4 


oobooUU - 


DL ip 
rlUS 


846342-846448 


32 8y4y 


CA CR7CC 

b4bb/bb 


ft jl!n i in 

Minus 


43552-43619 


330313 


0U42UoU 


ft A i n itft 

Minus 


33642-33775 


o2yuub 


bbbob4z 


DIi ip 

rlUS 


85470-85673 


oonocc 
odUJbb 


29441 Ub 


Plup 
rlUS 


151837-151914 

9 *^ ■ W^# I 1 1 W ■ • 


3303/ 2 


bbBU4yb 


ft lin i ii> 

Minus 


317461-317688 


329033 


58b8bbl 


Minus 


5390-5479 


32903/ 


58bobb2 


ft Jl I 1 1 ^ 

Minus 


32466-32562 


329067 


5868591 


Minus 


146417-147652 

1 9 III -f 41 \J \M 


329134 


5obob/9 


DL ip 

rlUS 


29959-30018 

*»w WV'w www Iw 7 


nnni r-7 

329157 


COCQC07 

58b8b8/ 


Minus 


145940-146155 

9 1 VV IV 1 IW 9 \A 


329178 


58bo/U4 


DIup 

rlUS 


179177-179463 

9 1 W 119 ) 1 W C WW 


3291 92 


58bo/ lb 


Oil «r» 

rlUS 


166936-167020 


3<:yiy4 


bobonb 


ft n t n 1 1 r 1 

Minus 


304450-304559 


329204 


5868720 


Minus 


3050-3190 


329224 


5868728 


Plus 


27422-27664 


329228 


5868728 


Minus 


50118-50287 


329288 


5868771 


Plus 


25554-26299 


329337 


5868806 


Minus 


467155-467222 


329011 


6682532 


Plus 


48658-48741 



PCT/US02/12476 



151 



WO 02/086443 

TABLE 9A: Potential Therapeutic, Diagnostic and Prognostic targets for Therapy of Lung Cancer 



PCT/US02/12476 



Table 9A shows about 1312 genes up-regulated in lung tumors (including squamous cell carcinomas, adenocarcinomas, small cell carcinomas, granulomatous and carcinoid 
tumors) relative to normal body tissues. These genes were selected from about 59680 probesets on the Eos/Affymetrix Hu03 Genechip array. 

Table 9B shows the accession numbers for those Pkeys lacking Unigene IDs for Table 9A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Table 9C shows the genomic positioning for those Pkeys lacking Unigene IDs and accession numbers in Table 9A. For each predicted exon, we have listed the genomic 
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 



Pkey: 
ExAccn: 
UnigeneID: 
Unigene Title: 
R1: 

R2: 



Unique Eos probeset identifier number 

Exemplar Accession number, Genbank accession number 

Unigene number 

Unigene gene title 

Average of lung tumors (including squamous cell carcinomas, adenocarcinomas, small cell carcinomas, granulomatous and carcinoid tumors) divided by the 
average of normal lung samples 

Average of non-malignant lung disease samples (including bronchitis, emphysema, fibrosis, atelectasis, asthma) divided by the average of normal lung samples 
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lengsin 


Q C"7 


Q7 AA 

o/.UU 


a r\ f\ t— t\ 

400560 




Nlvi w 030o78 .Homo sapiens cytochrome r4bu, 


"\ AA 


•1 nn 

I.UU 


400664 




kill /\ ^\ A J ri[*,| 1 _ n. mmm»^vm*% m'w> a|mi, ■ /st/s|f /\r\M/> 

NM_002425:Homo sapiens matnx metailopro 


zu.zb 


/c: nn 

40.UU 


400665 




NM_002425:Homo sapiens matrix metailopro 


l.ob 


4 A7 
l.U/ 


400666 




NM_002425:Homo sapiens matrix metailopro 


O.ZO 


O 09 


400749 




tit j AAn«(Ar#.iJ^--iA Mnn ! A nA ^. _4;t: « _ ^ i « i _ -j 

NM_003105 :Homo sapiens sortilin-related 


4 nA 
I.UU 


qi nn 
yi.uu 


400763 




Target Exon 


T RQ 
/.DO 


94 nn 
^.uu 


401027 




Target Exon 


1 AA 
I.UU 


-1 AA 
I.UU 


401093 




C1 2000586 :gi|63301 67 Id bj | B AA8 6477. 1 1 (A 


1 AA 
I.UU 


ice nn 
lob.UU 


401203 




Target Exon 


1 AA 
I.UU 


pr nn 
oo.uu 


A (\ A O A O 

401212 




CI 2000457 :gi|751zl /o[pir|ll oUdd/ poiypr 


1 nn 
I.UU 


Ann nn 
hUU.UU 


try A A A A 

401411 




ENSP00000247172 :HYrL;IHbllL/AL izb.^KUa 


1 nn 

I .UU 


79 nn 
/ z.uu 


401435 




C14000397 :gij749S89o[pir(|Md295 hypotn 


4 AA 

I.UU 


Ri4 nn 

04.Uu 


A ry A j a 

401464 


AF039241 


histone deacetylase 5 


Q QO 
O.Ol 


AO. AA 

4».UU 


J i"\ A — » A A 

401714 




ENSP00000241802 :CDNA I-LJ11007 Ho, CLUN 


O AO 


yin nn 
4U.UU 


A f\ A -T A ~7 

401747 




Homo sapiens keratin 17 (KRT17) 


•10Q y(0 


rq nn 
bo.uu 


401760 




Target Exon 


1./4 


OR AA 
OO.UU 


401780 




NM_005557 :Homo sapiens keratin 16 (foca 


OR /t7 


in CA 
lU.&U 


i r\ a -rn A 

401781 




Target Exon 


■1 A OO 

lU.oo 


A R1 

4.01 


401785 




kill AAnATPt.l -. n 1 ... i' ^ c /l/DT'l 

NM_002275 :Homo sapiens keratin 15 (KRT1 


4.1o 


O 7A 

z. /U 


401797 




Target Exon 


i AA 
1.44 


9 in 

Z. IU 


401961 




NM_021626:Homo sapiens serine carboxypep 


1.41 


1.86 


401985 


AF053004 


class l cytokine receptor 


1.00 


177.00 


401994 




Target Exon 


61.84 


47.00 


402075 




ENSP00000251056*:Plasma membrane calcium 


1.00 


1.00 


402260 




NM_001436*:Homo sapiens fibrillarin (FBL 


1.58 


1.39 


402265 




Target Exon 


2.09 


35.00 


402297 




Target Exon 


1.00 


92.00 


402408 




NM 030920*:Homo sapiens hypothetical pro 


28.87 


13.00 


402420 




C1000823*:gii10432400(emb|CAC10290.1|(A 


1.00 


1.44 


402674 




Target Exon 


7.44 


243.00 


402802 




NM_001397:Homo sapiens endothelin conver 


1.00 


70.00 


402994 




NM_002463*:Homo sapiens myxovirus (influ 


1.37 


1.43 


403137 




NM_005381*:Homo sapiens nucleolin (NCL), 


1.00 


19.00 


403306 


NMJHJ6825 


transmembrane protein (63kD), endoplasmi 


1.00 


43.00 


403329 




Target Exon 


1.00 


61.00 


403381 




ENSP00000231844*:Ecotropic virus integra 


1.00 


119.00 


403478 




NM„022342:Homo sapiens kinesin protein 9 


28.13 


136.00 


403485 




G300 1 81 3*:gi 1 1 2737279|ref |XP_01 21 63. 1 1 k 


20.23 


76.00 


403627 




Target Exon 


6.30 


29.33 


403715 




Target Exon 


1.30 


35.00 


404044 




ENSP00000237855*:DJ398G3.2 (NOVEL PROTEl 


1.00 


54.00 


404076 




NM 016020*:Homo sapiens CGI-75 protein ( 


14.29 


91.00 


404101 




C8000950:gi|423560|pir|lA47318RNA-bindi 


1.00 


1.00 


404140 




NM__006510:Homo sapiens ret finger protei 


1.42 


1.44 


404165 




ENSP00000244562:NRH dehydrogenase [quino 


1.00 


54.00 


404165 




Target Exon 


1.00 


117.00 


404210 




NM_005936:Homo sapiens myeloid/lymphoid 


5.93 


13.77 


404253 




NMJ)21058*:Homo sapiens H2B histone fami 


1.00 


1.00 
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i) 


r*ci\<\4 nnn.^inn a A a 4 1»iu:ie> a a 4 oonn <ii fnifio 
C6001 909:gi|704441 |dbj|BAA1 8909.1 1 (U298 


OQ 74 
29./1 


ao nn 
42.UU 


404298 






C6001 238 :gi[121 71 5|sp|P26b97|GlA3_UHICK 


4 on 
1.30 


4 nn 
l.UU 


Af\AOA7 

404347 






Target Exon 


4 nn 


1 nn 
l.UU 


404440 






NM_021048:Homo sapiens meianoma anogen, 


4 nn 
l.UU 


ic nn 
IO.UU 


404721 






NM_00ooyb :Homo sapiens nuclear tactor i 


l.UU 


cn nn 
bU.UU 


404/y4 


NM_00007o 




cnoiesteryi esier iransier protein, pias 


1 A7 

1 .11/ 


1 QR 

I.Jo 


A f\ A or A 

404854 






Target Exon 


1 R4 

l.bl 


0 ni 
z.Ul 


At\A Q77 

4048/ 1 






NM_uU5obb.riomo sapiens meianoma antigen, 


1 nn 

l.UU 


1 nn 

l.UU 


404927 






Target Exon 


1 OA 
l.UU 


1 nn 

l.UU 


a r\ inn/? 

404996 






Target Exon 


4 nn 
l.UU 


1 nn 
l.UU 


Ai~tC A Ad 

405449 






LYU0UU4/ :gi|n4z/2o4|rei|Ar_uuyjyy.i| z 


1 nn 

l.UU 


1 nn 

l.UU 


405568 






NM_031413 .Homo sapiens cat eye synarome 


•1 nn 

l.UU 


7Q nn 

I o.UU 


405572 






Target Exon 


n 7R 


1 1 4 
1.14 


405646 






ui20UU20U:gi|4bbf z2b|retiiNr_uuuuuo.i| ai 


l.U 1 


1 OR 
l.ZO 


J rt T- f>~l A 

405676 


nrAA/?7<i A 

BE336714 




cytochrome c-1 


4 1*3 


O QQ 

z.oy 


405770 






A. 1 A A AAAAAA.t 1 - — — ^> ? _ — _ - -■ _n_f j- ■ t_-l 

NM_002362:Homo sapiens meianoma antigen, 


VIC CO 

40.52 


ot nn 
3/.UU 


405932 






C15000305.g)|38Ub122|gDjAAO69l98.l| (AhO 


j.yy 


1 QQ 

i.yy 


Ar\cA m 

406137 






kill f\f\fH7n*.LJ^mn pppippp miltC /C pnlt\ K 

NM„ooui /9 :Homo sapiens mutb (b. con) n 


tZ.lt 


0 OQ 
Z.OO 


406360 






I arget bxon 


1 nn 

l.UU 


qc nn 

OO.UU 


406399 






A 1 A j| AAA4 AAtil-l*wAi^ f***nirtrtrt **rtvi#%rt nrA^A^Pn 

nm„uuoiZZ .nomo sapiens serine protease 


1 nn 

l.UU 


^q nn 
oy.uu 


A A A A 

406467 






Target bxon 


i nn 

l.UU 


1 nn 

l.UU 


406621 


X57809 


If-. 4 A 4 4 AC 

HS. 181125 


immunoglobulin lambda locus 


1.41 


1 7 A 
1./4 


406642 


AJ 2452 10 




gbiHomo sapiens mKNA tor immunoglobulin 


c. ID 


*3 01 


4UbbbJ 


U24b8J 


nS.Z9344 1 


immunoglobulin neavy constant mu 


9 07 
£.M( 


9 01 


Af\CC74 

406671 


AA 129547 


M _ OQC7C/I 

HS.28bf 54 


- j^, A «^ r «v n rt rt ^> f W rt rt rt T rt rtl f 4 /% nmtltlK Trt 

met proto-oncogene ^nepatocyte growtn ta 


1^ nn 


ci nn 
o 1 .uu 


406673 


M3499D 


Up HOQOCO 

nS.19b2o3 


•^*rtirt»" rt ■ rtirt n.rs. i^rt rt rt 4 1 rti 11 ■ 4i t rt rt rtr^ rt 1 rt \* rtlrtr'f^ 

major nistocompaiiDiiiiy complex, ciass 


n qr 
u.yo 


9. no 


A AA A "7f? 

406676 


vcoonn 

X58399 


HS.81221 


1 li ivvi^rt 1 A Ar iH/mnorirst r\ (• t * rt r*rt rt n^rt rt rt rt /"J Irtrt 

Human L2-9 transcript or unrearrangea im, 


1 ^n 


1 C9 


40bb78 


U/ /bJ4 




rt • l_l f irt~i rt rt, rtfrtrtrt 4. A 4 4 *rrt mt 1 n AA 1 rtrt.i ill n 1 1 rt rl rt 

go.numan clone iaii immunogiouuiin vana 




J .40 


406685 


M1 8728 




gb: Human nonspecific crossreacting an tig 


1.40 


9 QR 


406687 


M31126 


Up O70QO0 

HS.272822 


,>> m rt rt rt rt rtt t rt rt rt rtl^lrt rt 4 rt 1 rt It f rt rtrt ^rtirt 1 rt O 

pregnancy specinc oeta-i -glycoprotein y 


0.0 I 


ft cn 
o.ou 


406690 


M29540 


HS.220529 


nMri^inn^mUm mni/\ rtrt4i#vrtrt ■•rtlrtTrtrt rtrtll rtrt 

carcinoembryonic anugen-reiateo ceil aa 


OOP. T7 


9cn nn 
oou.uu 


406698 


X03068 


Up "7 < 3flO< 

Hs.73931 


major nistocompatiDiiity complex, class 


1 AI 
l.U I 


9 C9 
Z.OZ 


406815 


A. A AAAAAA 

AA833930 


1 1_ A A A A A A 

Hs.288036 


tRNA isopentenylpyrophosphate transferas 


on Oc 
20.2b 


09 nn 
32.UU 


4 aaoc 4 

406851 


A A AAO*7A J 

AA609784 




major histocompatibility complex, class 


n 7K 


1 Q1 

i.yi 


406964 


i ini oAr 

M21305 




gb:Human alpha satellite and satellite 3 


CO 4 r 

38.15 


nn 

1114.UU 


406967 


M24349 




. 1 1 t k r-rt rt rt n ,— . — « 1 1-. . i^AI^J rt rt PrV^ rt rt rt. 1 ■ |>rt rt F*rt4rt 1 

go. Human paratnyroid normone-HKe protei 


1 AO 
l.UU 


1 nn 

l.UU 


406974 


A JC7009 

M57293 




litMtMn ***rt 4 1> > j rrt < »J t>rt«»rt^rtrt/^ »» rt 1 rt t rt f\ rt rt rt 

gD.numan paratnyroja normone-reiatcu pep 


1 nn 

l.UU 


1 nn 

l.UU 


407103 


A A A HAQ04 

AA424881 


Up OCCOn4 

HS.25b3U1 


nypotneticai protein Mboioi/u 


1 77 
l./f 


1 m 

1. IU 


4 a~7 •! on 

407128 


R83312 


Hs.237260 


COT 

EST 


n nn 
l.UU 


1 nn 

l.UU 


407137 


T97307 




nlvti lAuOnfitT ««4 t^rtrtt"rt#» »rt4rtl lltfrt** rtrtlrtrtrt 

gb:yeoonub.si ooaresietai liver spleen 


140 7n 


19c nn 

I JO.UU 


it ATI 4 CO 

407168 


R45175 


Up 4 4 ~34 OO 

Hs.1 17183 


cols 


Z. IQ 


in nn 

IO.UU 


a a*7a a a 

407239 


AA076350 


Up CtQAG 

HS.67846 


1 _ . kl*rtrtt*4rt \ «p*-s * 1 rt rt rt 1 rt * 1 1 1 rt |!|y j-s rt rt rt trt *> 

leukocyte immunogiobulin-UKe receptor, 


1 m 

1. IU 


1 C7 
1.0/ 


407242 


M18728 




_L * 1 1 » ■ pv«rt rt rt rt rt rt rt rtrt ifirt rt #>rt rt rt «• rt rt rt f i rt rt rt rt 4l rt 

go.Human nonspecitic crossreacting antig 


1 10 
I. iz 


9 RC 
Z.OO 


407244 


1 4 4 AA4 A 

M10014 


1 1 _ TCA04 

Hs.75431 


fibrinogen, gamma polypeptide 


•3 OA 


1C OQ 
10.00 


407289 


A A A A f7 4 Cf\ 

AA135159 


1 }~ A AAA A A 

Hs. 203349 


1 1 mmha rt rtrt.AB.rt rt r^Kt A tTI |4A4 4Ar!_ *I AM 1 J A 

Homo sapiens cUNA FLJ12l4y tis, clone MA 


0.00 


0 CQ 
0.00 


M 0"f A Art 

407300 


A A A AAA A A 

M102616 


1 I* 4 AA7 A A 

Hs.1 20769 


J A^A^ _4 Ou-tM-AWA I_lrt1 >>* rtrtll *»o no 

gb:zn43e07.s1 Stratagene HeLa cell s3 93 


1Q 7jI 


70 nn 
M.UU 


j rt*"»r^ rtrt 

407366 


A r^rtA A A A rt 

AF026942 


1 1 _ r\-t A rlA 

Hs.271530 


gb:Homo sapiens cig33 mRNA, partial sequ 


n nc 
U.Ub 


Q 9C 

o.zo 


407378 


A A AAAOA J 

AA299264 


1 1— r77l/* 

Hs.57776 


ESTs, Moderately similar to (38022 nypot 


1 nn 
1.00 


oc nn 
zb.UU 


a f\~r Ann 

407430 


A t~A AAAr* 4 

AF1 69351 




\ 11 _j in ri KKniAatM M#iklAin 4* t^rtrt ■ h« rt rt rt rt rt 

gb:Homo sapiens protein tyrosine pnospna 


•1 nn 
l.UU 


oc nn 
ZO.UU 


407453 


AJ 1 32087 




^kLv * 1 1 j-ij-l j-i >^ ■ a rt rt rtrt [ 1 0k 1 A rt i* rt^L#rt\ rt rt Pnrt rt^l rt^ t J rt n 

gu:Honio sapiens mKNA tor axonsmai aynGin 


1 nn 
l.UU 


7C nn 

f O.UU 


A A*7/?"7*7 

407577 


A I AM A 4 A A A 

AW131324 


1 t_ rt a A7L*n 

Hs, 246759 


hypothetical protein MGC1 2538 


1 nn 
l.UU 


1 nn 
l.UU 


407634 


A I A f A 4 A f~ A A 

AW016569 


IL 4 A A 4 4 A 

Hs. 136414 


I i nj y"M aAI a ..UaIaA*.! l^i. 4 OKI «-aIi «lrt 1 ■ < rt 

UDP-GIcNAc:betaGal beta-1 ,3-N-acetylgluc 


444 on 
111.2U 


99Q nn 
zzo.UU 


407710 


A1A /AA A A "7 

AW022727 


Up OOC<l C 

HS.23616 


ESTs 


1 nn 
l.UU 


9Q nn 

ZO.UU 


407720 


A n A A "7*7 "7 A 

AB037776 


Hs.38002 


KIAA1355 protein 


1 no 
i.oy 


1 01 


AMI AC 

40774b 


AKOOlybz 




rt i j rt rt 4 rt rtilrt rt t rt rrt 4rt in CI 1114 Oi Ol 

nypotneticai protein rumuu 


1 nn 

l.UU 


1 nn 

I .uu 


407756 


A A A A A A A4 

AA1 16021 


Up OOlCft 

HS.38260 


ubiquitin specific protease lo 


A Ki 
4.01 


c nn 

O.UU 


407758 


nrAA*l c 

D50915 


If- AAACC 

Hs. 38365 


l/i a A AH AC Mrtrtrt rt»rtrJ*irti 

KIAA0125 gene product 


1 nn 
l.UU 


9R nn 

ZO.UU 


407782 


a Acnoncc 
AAbObybb 


Up 4 4 9C1 O 

HS.Hzbiy 


bo is, Moaerateiy similar to rUKNiNJt l>cl 


n 07 
u.y» 




407788 


nrf "1 4 AAA 

BE514982 


Up Iat\ft4 

HS.38991 


A 1 4 A A haIaii km rt ■ rt rt 1 rt n»rt4rtlrt A A 

falOO calcium-binding protein A2 


7 QQ 

(.00 


9 fl9 


407790 


A1027274 


Hs, 288941 


1 i.„ A pppSppp — A CI 1 4 A DCC (!« -U nn n| 

Homo sapiens cUinA FLJi48bb fis, clone rL 


Q CO 

o.bo 


49 nn 

4Z.UU 


40781 1 


AW1 90902 


Up jinnno 

HS.40098 


M«krtlrttrtrt 1* rtrt 4 AilMA^nmilll 4 DA JD rtrt 4 rtrt rtrt 

cysteine knot supertamiiy \, bMH antagon 


OQ OR 


ina nn 
i uy.uu 


407839 


A A A A C4 A A 

AA045144 


Up 

Hs.1 61566 


ESTS 


17^ 01 


inn nn 

IUO.UU 


Af\7t\ A A 

407944 


R34008 


Up 09(V7'V7 

HS. 2397 27 


desmocollin 2 


in ^n 
n i.ou 


7n nn 
f u.uu 


408000 


L1 1690 


Up CIA 

Hs.620 


bullous pempmgoid antigen i 123U/24Ukuj 


1C1 17 
IO l.l / 


ft nn 

O.UU 


J/\0 A A4 

408031 


A AAA4AAI? 

AA081395 


1 J04~7A 

Hs.42173 


Homo sapiens cDNA FLJ103bb fis, clone NT 


y.yi 


qo nn 
yj.uu 


A AflA AA 

408063 


BE086548 


Hs.42346 


calcineurin-binding protein calsarcin-1 


IOC "7Q 

iyb./8 


001 nn 
231. UU 


408070 


AW1 48852 




gb:xf05d05.x1 NCI_CGAP_Brn35 Homo sapien 


1 nn 
l.UU 


1 nn 
l.UU 


A rt O 4 A 4 

408101 


A 1 A XAA AAA A 

AW968504 


1 k j ri A A*7 A 

Hs.1 23073 


CDC2-related protein kinase 7 


07 OA 

of .84 


R4 nn 


408122 


AI432652 


Up JOOOyt 

Hs.42824 


nypotneticai protein rUlO/lo 


n nc 

U.00 


1 71 

1,/ 1 


408212 


A A KY7ITC'7 

AA2y7oo7 


Up yt^^OO 

HS.43728 


nypotneticai protein 


c 

0.00 


7 01 


408243 


Y00787 


Up eivi 
Hs.624 


interleukin 8 


A 07 


Q Oft 

y.yo 


40834a 


Bbo4b947 


Up yl>l<T7C 

HS.44276 


nomeo box uiu 


70 

0. /y 


9 4ft 
0.40 


408353 


BE439838 


Hs.44298 


«tlrt » J « «t ^Urtrtrtr-» n l rtitrtlrtirt 04*7 

mitochondnal nbosomal protein S17 


1 


1 RC 

l.bb 


MflAf A 

408354 


A IOQOOAO 

A1382803 


Up <cnior 

Hs. 159235 


ESTs 


1 nn 
l.UU 


79 nn 
/o.UU 


A AA A AA 

408369 


R3B438 


Up "1 OOC7C 

Hs. 182575 


_ — 1 . .1a -— » ■ ^ — f M yM!lll 4 C / 1 _ J A A A 4a*A H% m% rt *-4 

solute carrier family 15 (H i i i transport 


1 A4 

1.41 


1ft CA 
10.0U 


408380 


AF1 23050 


Hs.44532 


di ubiquitin 


1C in 

lo.iy 


97 99 
0/ ,zz 


4AA iflA 

408482 


NM_000676 


Hs.45743 


adenosine A2b receptor 


1 cc 

i.bb 


1 10 

i. ly 


408522 


A 1 r A A A A A 

A1541214 


I 1 _ i A AAA 

Hs.46320 


Small prohne-nch protein SPRK [human, 


1 OQ 


1 9>1 
1.Z4 


4U00O0 


A\A/9R1 C99 

AVVOO I00Z 


U. HOCI DO 

ns. Jobloo 


to 1 S 




1 50 


408545 


AW235405 


Hs.253690 


ESTs 


1.00 


1.00 


408572 


AA055611 


Hs.226568 


ESTs, Moderately similar to ALU4_HUMAN A 


1.00 


44.00 


408633 


AW963372 


Hs.46677 


PRO2000 protein 


107.16 


56.00 


408660 


AA525775 




ESTs, Moderately similar to PC4259 ferri 


1.00 


1.00 


408761 


AA057264 


Hs.238936 


ESTs, Weakly similar to (defline not ava 


52.24 


141.00 


408771 


AW732573 


Hs.47584 


potassium voltage-gated channel, delayed 


3.05 


109.00 
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408783 


a r"<ioof*oo 

AF1 92522 


1 ATTnA 

Hs.47701 


408790 


A l*/r*AAA A^ 

AW580227 


Hs.47860 


408805 


H69912 


Hs.48269 


j OOO J 4 

408841 


AW438865 


Hs.256862 


408873 


A) A 4 A A .4 ~7 

AL046017 


Hs. 182278 


j aaa a r\ 

408908 


n ^oo rt rt*r 

BE296227 


t 1 O CAOAA 

Hs.250822 


4 o n nnn 

408992 


AA059325 


1 l 7iPiA 

Hs.71642 


408996 


A 10*70 4 AO 

AI979168 


Hs. 344096 


409015 


BE389387 


Hs.49767 


409038 


~m~r Ann 

T97490 


Hs.50002 


jnnn A a 

409041 


AB033025 


Hs.50081 


4 000*7-7 

409077 


a a a t\A oen 

AA401369 


U_ HnA"70-l 

Hs.1 90721 


409093 


BE243B34 


HS.50441 


409103 


AF251237 


Hs. 112208 


Ann 4 A n 

409142 


AL1 36877 


Li*, cn-rco 

Hs.50758 


409187 


A r*«i C" 4 AAA 

AF154830 


HS.50966 


409228 


a lee j ono 

A1654298 


Hs. 271695 


j n n n a ji 

409234 


A lf1*7n A A O 

AI879419 


Hs. 27206 


409268 


A A AArA A J 

AA625304 


1 1^ A rt-Tff -TO 

Hs. 187579 


409269 


A A nnArA 

AA576953 


1 1 — AAA! o 

Hs.22972 


409361 


NM_005982 


Hs.54416 


409404 
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A1761324AW880941 AW880937 

AW118072AI631982T15734AA224195A1701458W20198 F26326 AA890570 N90552AW071907 AI671 352 A1375892 T03517 R88265 
Al 124088 AA224388 AI08431 6 AI354686 T33652 Al 14071 9 AI72021 1 T03490 A1372637 T15415 AW205836 AA630384 T03515 T33230 
AA017131 AA443303 T33623 AI222556 T33511 T33785 AI419606 D55612 

W52854AL1 17600 BE208116 BE208432 BE206239 BE082291 AW953423 AA351619 BE180648 BE140560 W60080 AA865478 N90291 
AW450652 AW44951 9 AA993634 AI806539 AA351618 AW449522 AI827626 AA904788 AA380381 AA886045 AA774409 BE003229 Z41756 
AL133619 AA468118 AA383064 A1476447 T09430 AI673758 M524895 AI581345 AI300820 AW498812 M256162 AI559724 AI685732 
AA602400 AA905453 AI204595 AW1 66541 AA1 57456 AA1 56269 AA383652 AA431 072 AW592707 AI43541 0 AW272464 AI21 5594 AA622747 
R74039N35031 A1804128 AW513621 AA868351 A1026826 A1493388 AA614641 W81604AI567080 AI214351 M730140 AI125754 AI200813 
AI269603 AI565082 A1807095 AI476629 AA505909 AI368449 AI686077 AI582930 AW085038 AA757863 AA7301 54 AI767072 AA46831 6 
AI734130 A1734138 M426284 AA433997 AI741241 AW043563 AI732741 AI732734 M437369 M425820 AA664048 R74130 
BE144666 BE184942 AW238414 BE184946 
AW993247AW861464 
AA203682 R11958 

BE550224AA832519 N45402 AW885857 N29245 BE465409 W07677 AW970089 AI299731 AA482971 BE503548 H18151 W79223 AF086393 
AA461301 W74510 R34182 AI090689 N46003 BE071550 R28075 AW134982 AI240204 AI138906 AW026179 A1572316 BE466182 AI206395 
A1276154AI273269 AI422817 AI371014 AI421274 A1188525 AA939164 BE549810 AW1 37865 AI694996 BE503841 AA459718 BE327407 
BE467534 BE218421 BE467767 M989054 BE467063 AI797130 BE327781 



TABLE 9C 

Pkey: Unique number corresponding to an Eos probeset 

Ref: Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA

sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495.
Strand: Indicates DNA strand from which exons were predicted. 
Nt_position: Indicates nucleotide positions of predicted exons.



Pkey


Ref


Strand


Nt_position


400512 


9796593 


Minus 


1439-1615 


400517 


9796686 


Minus 


49996-50346 


400560 


9843598 


Plus 


94182-94323,97056-97243,101095-101236,102824-103005 


400664 


8118496 


Plus 


13558-13721,13942-14090,14554-14679 


400665 


8118496 


Plus 


16879-17023 


400666 


8118496 


Plus 


17982-18115,20297-20456 


400749 


7331445 


Minus 


9162-9293 


400763 


8131616 


Minus 


35537-35784 


401027 


7230983 


Minus 


70407-70554,71060-71160 


401093 


8516137 


Minus 


22335-23166 


401203 


9743387 


Minus 


172961-173056,173868-173928


401212 


9858408 


Plus 


87839-88028 


401411 


7799787 


Minus 


144144-144329 


401435 


8217934 


Minus 


54508-55233 


401464 


6682291 


Minus 


170688-170834 


401714 


6715702 


Plus 


96484-96681 


401747 


9789672 


Minus 


118596-118816,119119-119244,119609-119761,120422-120990,130161-130381,130468-130593,131097-131258,131866- 








131932,132451-132575,133580-134011 


401760 


9929699 


Plus 


83126-83250,85320-85540,94719-95287


401780 


7249190 


Minus 


28397-28617,28920-29045,29135-29296,29411-29567,29705-29787,30224-30573 


401781 


7249190 


Minus 


83215-83435,83531-83656,83740-83901,84237-84393,84955-85037,86290-86814 


401785 


7249190 


Minus 


165776-165996,166189-166314,166408-166569,167112-167268,167387-167469,168634-168942 


401797 


6730720 


Plus 


6973-7118 


401961 


4581193 


Minus 


124054-124209 


401985 


2580474 


Plus 


61542-61750 


401994 


4153858 


Minus 


42904-43124,43211-43336,44607-44763,45199-45281,46337-46732


402075 


8117407 


Plus 


121907-122035,122804-122921,124019-124161,124455-124610,125672-126076 


402260 


3399665 


Minus 


113765-113910,115653-115765,116808-116940 


402265 


3287673 


Plus 


21059-21168 


402297 


6598824 


Plus


35279-35405,35573-35659 


402408 


9796239 


Minus 


110326-110491 
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402420 


9796339 


Plus 


129750-129919 


402674 


8077108 


ft ■ ■ 

Minus 


39290-39502 


402802 


3287156 


Minus 


53242-53432 


402994 


2996643 


Minus 


4727-4969 


403137 


r\0 A A ft f\ A 

9211494 


Minus 


n^un ft^ni ftftnto norioj noc~7n mho AOftjio fiJir\*7n o^cru C\Ataq ftcnx ficoi7 

92349-92572,92958-93084,93579-9371 2,93949-94072,94591 -94743,9521 4-95.W 


403306 


8099945 


Plus 


127100-127251 


403329 


8516120 


Plus 


96450-96598 


403381 


9438267 


Minus 


26009-26178 


403478 


9958258 


Plus 


116458-116564 


403485 


9966528 


Plus 


2888-3001,3198-3532,3655-4117


403627 


8569879 


ft i ' 

Minus 


23868-24342 


403715 


7239669 


Plus 


85128-85292 


404044 


9558573 


t ft 1 

Minus 


225757-225939 


404076 


9931752 


Minus 


aa jA n^>n*v 

3848-3967 


404101 


8076925 


ft ft* 

Minus 


125742-125997 


404140 


9843520 


Plus


37761-38147 


404165 


9926489 


lit . 

Minus 


69025-69128 


404185 


4572584 


ft i* 

Minus 


iftAj ~j a a or\ A>r\*rr 

129171-129327 


404210 


5006246 


Plus 


j /~*r\fi*>/* A*7f\Ar\A 

169926-170121 


404253 


9367202 


Minus 


55675-56055 


404287 


2326514 


Plus 


»- rv 4 4 rn^n4 

53134-53281 


404298 


nn A inno 

9944263 


ft j» »- 

Minus 


73591-73723 


404347 


9838195 


Plus 


*Y 1 IAA — » J a A 

74493-74829 


404440 


7528051 


Plus 


80430-81581 


404721 


9856648 


ft ft' 

Minus 


173763-174294 


ft f\ A 1 

404794 


4826439 


Plus 


101619-101898 


404854 


7143420 


Plus 


14260-14537 


404877 


1519284 


Plus


1095-2107 


404927 


7342002 


Plus 


/> fy f^jry s\ AAr/*/t 

68690-69563 


404996 


6007890 


Plus 


37999-38145,38652-38998,39727-39872,40557-40674,42351-42450 


405449 


7622497 


Plus 


42236-42570 


A j~\ r- m n n 

405568 


6006906 


Plus


35912-36065 


405572 


3800891 


Plus 


85230-85938 


405646 


A f\ A 1 A r** Al 

4914350 


Plus 


741-969 


405676 


4557087 


Plus 


73195-73917 


405770 


2735037 


Plus 


61057-62075 


405932 


7767812 


Minus 


123525-123713 


406137 


9166422 


Minus 


30487-31058 


406360 


9256107 


Minus 


7513-7673 


406399 


9256288 


Minus 


63448-63554 


406467 


9795551 


Plus 


182212-182958 



TABLE 10A: Potential Therapeutic, Diagnostic and Prognostic targets for Therapy of Lung Cancer and Non-malignant Lung Disease 

Table 10A shows about 307 genes up-regulated in non-malignant lung disease relative to lung tumors and normal body tissues and/or down-regulated in lung tumors relative to
normal lung and non-malignant lung disease. These genes were selected from about 59680 probesets on the Eos/Affymetrix Hu03 GeneChip array.

Table 10B shows the accession numbers for those Pkeys lacking UnigeneIDs for Table 10A. For each probeset we have listed the gene cluster number from which the
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland, California). The Genbank accession numbers for sequences comprising each cluster are listed in the
"Accession" column.

Table 10C shows the genomic positioning for those Pkeys lacking UnigeneIDs and accession numbers in Table 10A. For each predicted exon, we have listed the genomic
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed.



Pkey: Unique Eos probeset identifier number

ExAccn: Exemplar Accession number, Genbank accession number

UnigeneID: Unigene number

Unigene Title: Unigene gene title

R1: Average of lung tumors (including squamous cell carcinomas, adenocarcinomas, small cell carcinomas, granulomatous and carcinoid tumors) divided by the
average of normal lung samples

R2: Average of non-malignant lung disease samples (including bronchitis, emphysema, fibrosis, atelectasis, asthma) divided by the average of normal lung samples



Pkey 


ExAccn 


UnigeneID


Unigene Title 


R1 


R2 


404394 






ENSP00000241075:TRRAP PROTEIN. 


0.79 


3.10


404916 






Target Exon 


100 


159.00 


405257 






Target Exon 


1.00 


422.00 


407228 


M25079 


Hs. 155376 


hemoglobin, beta 


0.47 


2.33 


407568 


AA740964 


Hs.62699 


ESTs 


1.00 


123.00 


408562 


AI436323 


Hs.31 141 


Homo sapiens mRNA for KIAA1568 protein, 


1.00 


230.00


409031 


AA376836 


Hs.76728 


ESTs 


1.00 


128.00 


410434 


AF051152 


Hs.63668 


toll-like receptor 2


39.65 


149.00 


410467 


AF102546 


Hs.63931 


dachshund (Drosophila) homolog 


1.00 


109.00 


410808 


T40326 


Hs.167793 


ESTs 


1.14 


13,14 


412351 


AL1 35960 


Hs.73828 


T-cell acute lymphocytic leukemia 1 


0.37 


2.27 


412372 


R65998 


Hs.2B5243 


hypothetical protein FU22029 


1.00 


173.00 


413795 


AL040178 


Hs.142003 


ESTs 


0.10 


11.90 


414154 


AW205314 


Hs.323060 


ESTs 


0.62 


2.09 


414214 


D49958 


Hs.75819 


glycoprotein M6A 


0.03 


4.55 


414998 


NM_002543


Hs.77729 


oxidised low density lipoprotein (lectin 


0.64 


2.97 


415122 


D60708 


Hs.22245 


ESTs 


0.07 


8.97 


415765 


NM_005424 


Hs.78824 


tyrosine kinase with immunoglobulin and 


0.67 


1.65 


415775 


H00747 


Hs.29792 


ESTs, Weakly similar to I38022 hypotheti 


0.29 


2.64 


415910 


U20350 


Hs.78913 


chemokine (C-X3-C) receptor 1 


1.00 


145.00 



170 



WO 02/086443 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



416319 


AI815601 


Hs.79197 


CD83 antigen (activated B lymphocytes, i


15.32 


237.00 


416402 


NM 000715 


Hs.1012 

V «w« * • ^™ 


complement component 4-binding protein, 


0.64 


4.00 


417355 


D13168 


Hs.82002 


endothelin receptor type B 


0.01 


3.90 


417421 


AL1 38201 


Hs.82120 


nuclear receptor subfamily 4, group A, m 


36.30 


357.00 


417511 


AL049176 


Hs.82223 


chordin-like 


1.00 


179.00 


418489 


U76421 


Hs.85302 


adenosine deaminase, RNA-specific, B1 (h 


0.02 


6.00 


418726 


BE241812 


Hs.87860 


protein tyrosine phosphatase, non-recept 


1.00 


113.00 


418741 


H83265 


Hs.8881 


ESTs, Weakly similar to S41044 chromosom 


0.44 


1.90 


418883 


BE387036 


Hs.1211 


acid phosphatase 5, tartrate resistant 


0.96 


2.04 


419086 


NM_000216


Hs.89591 


Kallmann syndrome 1 sequence 


0.62 


2.74 


419150 


T29618 


Hs.89640 


TEK tyrosine kinase, endothelial (venous 


0.03 


6.90 


419235 


AW470411 


Hs.288433 


neurotrimin 


1.48 


5.13 


419407 


AW410377 


Hs.41502 


hypothetical protein FLJ21276 


37.55 


336.00 


420556 


AA278300 


Hs.124292 


Homo sapiens cDNA: FLJ23123 fis, clone L 


0.80 


3.65 


420656 


AA279098 


Hs.187636 


ESTs 


1.65 


8.07 


420729 


AW964897 


Hs.290825 


ESTs 


2.99 


25.82 


421177 


AW070211 


Hs.102415 


Homo sapiens mRNA; cDNA DKFZp586N0121 (f 


0.46 


1.95 


422060 


R20893 


Hs.325823 


ESTs, Moderately similar to ALU5_HUMAN A 


1.00 


156.00 


422426 


W79117 


Hs.58559 


ESTs 


0.03 


7.44 


422652 


AW967969 

1 il • « w # V w w 


Hs. 118958 


syntaxin 11


0.14 


3.62 


423099 


NM 002837 


Hs.123641 


protein tyrosine phosphatase, receptor t 


0.01 


3.16 


424433 


H04607 


Hs.9218 


ESTs 


0.75 


141.75 


424585 


AA464840 


Hs. 131987 


ESTs 


1.00 


167.00 


424711 


NM_005795 


Hs.152175 


calcitonin receptor-like 


0.43 


3.01 


424973 


X92521 


Hs. 154057 


matrix metalloproteinase 19 


0.37 


19.45 


425023 


AW956889 


Hs.154210 


endothelial differentiation, sphingolipi 


0.14 


3.35 


425664 


AJGQ6276 


Hs.159Q03 


transient receptor potential channel 6 


1.00 


94.00 


425998 


AU076629 


Hs. 165950 


fibroblast growth factor receptor 4 


0.68 


1.42 


426657 


NM_015865 


Hs.171731 


solute carrier family 14 (urea transport 


0.03 


3,74 


426753 


T89832 


Hs. 170278 


ESTs 


1.00 


141.00 


427558 


D49493 


Hs.2171 


growth differentiation factor 10 


1.00 


117.00 


427983 


M177Q6 


Hs.2233 


colony stimulating factor 3 (granulocyte 


0.75 


2.20 


428467 


AK002121 


Hs. 184465 


hypothetical protein FLJ11259 


0.76 


2.25 


428927 


AA441837 


Hs.90250 

1 IW»WW«*"*V 


ESTs 


0.01 


3.62 


429496 


AA453800 

r V X * W W W V 


Hs.1 92793 


ESTs 


1.00 


138.00 


430468 


NM 004673 


Hs.241519 


angiopoietin-like 1 


1.00 


132.00 


431385 

TV 1 Www 


BE1 78536 

wtf* J V ^»^*X^XP 


Hs.11090 


membrane-spanning 4-domains, subfamily A 


1.00 


157.00 


431728 


NM 007351 

1 ill i^- lu w W 1 WW 1 


Hs.268107 


multimerin 


1.00 


157.00 


431848 


AI378857 


Hs. 126758 


ESTs, Highly similar to AF1 75283 1 zinc 


0.34 


2.24 


432128 


AA1 27221 


Hs.1 17037 


ESTs 


0.00 


1.15 


432519 


AI221311 


Hs.1 30704 


ESTs, Weakly similar to BCHUIA S-100 pro 


0.01 


2.06 


433043 

1 W W V » V 


W57554 


Hs.1 2501 9 


lymphoid nuclear protein (LAF-4) mRNA 


1.00 


267.00 


433803 


AI823593 


Hs.27688 


ESTs 


1.00 


105.00 


434730 


AA644669 


Hs.1 93042 


ESTs 


1.05 


3.15 


435472 


AW972330 


Hs.283022 


triggering receptor expressed on myeloid 


0.83 


1.94 


436532 


AA721522 




gb:nv54h12.r1 NCI CGAP_Ew1 Homo sapiens 


1.00 


218.00 


437119 


AI379921 

• **w ■ WW»™V 


Hs,177043 


ESTs 


1.00 


133.00 


437140 


AA312799 


Hs.283689 


activator of CREM in testis 


0.67 


122.67 


437211 


AA382207 


Hs.5509 


ecotropic viral integration site 2B 


1.00 


142.00 


437960 


A1669586 


Hs.222194 


ESTs 


1.00 


147.00 


438202 


AW1 69287 


Hs.22588 


ESTs 


1.00 


141.00 


438873 


AI302471 


Hs.124292 


Homo sapiens cDNA: FLJ23123 fis, clone L 


0.71 


3.66 


438875 


AA827640 


Hs.1 89059 


ESTs 


23.32 


370.00 


441048 


AA913488 


Hs.192102 


ESTs 


0.77 


8.50 


441188 


AW292830 


Hs.255609 


ESTs 


3.43 


16.36 


441499 


AW298235 


Hs.101689 


ESTs 


1.00 


167.00 


444513 


AL120214 


HsJ117 


glutamate receptor, ionotropic, AMPA 1


1.00 


151.00 


444527 


NM 005408 


Hs.1 1383 


small inducible cytokine subfamily A (Cy 


46.47 


153.00 


444561 


NM_004469


Hs.1 1392 


c-fos induced growth factor (vascular en 


0.01 


3.08 


445279 


R41900 


Hs.22245 


ESTs 


0.60 


141.00 


446017 


N98238 


Hs.55185 


ESTs 


0.18 


2.39 


446984 


AB020722 


Hs.16714 


Rho guanine exchange factor (GEF) 15 


0.10 


2.16 


446998 


N99013 


Hs.1 6762 


Homo sapiens mRNA; cDNA DKFZp564B2062 (f 


0.01 


2.53 


447357 


AI375922 


Hs.1 59367 


ESTs 


0.46 


2.64 


448106 


A1800470 


Hs.171941 


ESTs 


18.05 


296.00 


448253 


H25899 


Hs.201591 


ESTs 


1.00 


141.00 


449275 

1 1 Wb # W 


AW450848 


Hs.205457 


periaxin


0.56 


1.38 


450400 

~w w^ WW 


AI694722 


Hs.279744 


ESTs 


0.88 


4.33 


450696 

I W W W W w 


AI654223 


Hs.1 6026 

V IWi | v W W 


hypothetical protein FLJ23191 


0.52 


2.08 


450726 


AW204600 


Hs.250505 


retinoic acid receptor, alpha 


0.79 


2.01 


451497 


H83294 


Hs.284122 


Wnt inhibitory factor-1 


0.35 


2.03 


451533 


NM 004657 


Hs.26530 


serum deprivation response (phosphatidyl 


0.13 


2.25 


453636 


R67837 


Hs.1 69872 


ESTs 


1.00 


116.00 


458332 


AI000341 


Hs.220491 


ESTs 


1.00 


192.00 


459580 


AA022888 


Hs.176065 


ESTs 


0.20 


2.98 


400269 






Eos Control 


0.40 


2.40 


403421 






NM_016369*:Homo sapiens claudin 18 (CLDN 


0.53 


1.77 


407570 


Z19002 


Hs.37096 

■ ■ XP 1 ■ WW 


zinc finger protein 145 (Kruppel-like, e 


0.01 


3.18 


412295 


AW088826 


Hs.117176 


poly(A)-binding protein, nuclear 1 


0.56 


1.74 


414517 


M24461 


Hs.76305 


surfactant, pulmonary-associated protein 


0.64 


1.50 


417204 


N81037 


Hs.1 074 


surfactant, pulmonary-associated protein 


0.33 


1.16 


418307 


U70867 


Hs.83974 


solute carrier family 21 (prostaglandin


0.53 


1.55 


418935 


T28499 


Hs.89485 


carbonic anhydrase IV 


0.20 


1.28 


421502 


AF111856 


Hs.105039 


solute carrier family 34 (sodium phospha 


0.78 


1.90 


421798 


N74880 


Hs.29877 


N-acylsphingosine amidohydrolase (acid c 


0.59 


1.54 
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493354 


AR011130 

nuu 1 1 1 viu 


Hs 127436 


49373R 

HiOl OU 


AR0091 34 

nuuU£ io*t 


Uc 1^9195 


49591 1 


IUI1RRR7 
ivi lovjuf 


Hq 1RR7 
n&. iouf 


49543R 


TR991R 

1 \JC£- 1 U 


He 970R40 


49RR9R 


MM 000090 


H<5 179R70 

l to. 1 f £.U / u 


497019 


AA001732 

rVVJxJ 1 1 Ot. 


no. • i o^uj 


493043 


TQ294R 


He 9940 


4909R0 


AA3R125R 


H<; 937R6R 

I lO.^-Ol uuu 


411433 

*to \HOO 


yR50ifl 

AUJU I o 


He 253495 


431723 

*TU I 1 fcO 


AW058150 


Hs 16762 


439QR5 


T92363 


Hs 178703 


441R35 


AR03R439 


He 184 


442275 


AW449467 


Hs 54795 


443709 
*+*t«jf us 


AI0R9699 


Hs 134662 


444125 


AW152618 


Hs 16757 


450954 


A1904740 


Hs 25691 


451558 


kim 001089 


Hs 26630 


453310 


X70697 


Hs 553 


45RR55 


AF035528 


Hs 153863 


444342 


mm 014398 

l\IVI_VJ 1 tUSU 


Hs 10887 


400754 

4UUI Ot 






401045 

HU IUHJ 






401 0R3 






402474 






402R0R 






403021 






403438 






403687 






403764 






404277 






404288 






40451 R 

*rU*tO 1 U 


A1816601 




4051 OR 

4Uo 1 UQ 






4053R1 

HUooP 1 






40R3R7 






406646 

HUUUtU 


IVI JOUUU 




40R714 


AI91Q104 

AM/- 1 sOU*r 


He 2RR959 


40R753 

*tUUf UO 


AA506665 

rVrAoUUUUO 


He 917493 


406Q73 

■ft/USf O 


M34QQ6 


Hs 198253 


40794R 

HUf 4LHQ 


1 IR9975 


He 94498 


407510 

H\Jl O 1 U 


MQR1Q1 
usu 1 9 i 




407731 

HU/ f O 1 


MM OOOOfifi 

INIVI uuuuuu 


He 3R069 


407R30 

H\JI OOU 


NM 0010RR 

MIV1_ UU IUUU 


Hs 5R7 


40R045 


AW13R95Q 

fAVV IOUSOS 


He 245123 


40R074 


R90793 




40R374 


AW095430 


Hs 155591 


4090R4 


AA082Q54 


Hs 141883 

no* i *r i uuv 


40Q0R3 


AF0500R3 


He 673 


40Q153 

HUS lOO 


W03754 


Hs 50813 


409901 


AA7R0473 


He RR7 


40Q93R 


Al 04Q990 


He 61515 

JIO.O 1 0 1 O 


40Q3RQ 


AR007979 


Hs 301281 


40Q71R 

*?Us7 IO 


DRRR40 


Hs 56045 


4107QR 


RP17RR99 


Hs 16291 

no« i u J-C/ 1 


411090 


NM 006770 


Hs 67726 


41 1RR7 


RF1R019R 




419000 


AW57R555 


He 15780 

I IO. 1 O f UU 


41 935R 


RF047490 


Hs 24172 

1 I9.£*T lit. 


412420 


AL 035668 


Hs 73853 


4125R4 


XR3703 

AUUf Uv> 


Hs 31432 


41 2RRQ 


AA9Q0712 


Hs 82407 


412870 

1 1 fcU I u 


W22788 


Hs 82407 


413529 


U11874 


Hs 846 


413533 


BF 146973 




41 3RRQ 


RF1572R6 


Hs 20631 


41 3794 


AA131466 


Hs 23767 

1 IO«^w f Uf 


41 3R00 


AI19Q93R 


He 192235 


413R02 


AWQR4490 


Hs 32241 


41 1R9Q 


MM 001 R79 

I\JV1_UU 1 U / <t 


He 76572 
no. I oo/ £. 


41437R 


RF393R56 


He 66915 

1 IO.UUJ7 1 O 


414577 


AI05R54R 


H«? 72116 

1 IO. 1 C 1 I u 


414700 


HR3909 


He 3R1R3 
no. oo luo 


41507R 


AA311993 

/A/AO I 1 ££0 


He 9R3091 


415190 


Wfi44R4 


He 34950 


41 5191 
I oOCO 


RF9RQ359 


He Q49 


416315 


AAR47758 


He 111030 

1 IO ■ 1 1 1 UOU 


41 55R9 

*t i OoO£ 


WQ9445 


He 165195 
> id. i uo i so 


41R030 


H 15261 

1 1 1 0£U 1 


He 91948 


418497 


BF244050 


He 79307 

1 IO. 1 SOU I 


416464 


NMJ00132 


Hs.79345 


416585 ' 


X54162 


Hs.79386 


416847 


L43821 


Hs.80261 


417148 


AA359896 


Hs.293885 


417370 


T28651 


Hs.82030 


417673 


T87281 


Hs.16355 



calcium channel, voltage-dependent, alph 
airway trypsin-like protease
progastricsin (pepsinogen C) 
ESTs 

activin A receptor type II-like 1

hypothetical protein FLJ 10970 

uteroglobin 

interleukin 7 receptor 

surfactant, pulmonary-associated protein 

Homo sapiens mRNA; cDNA DKFZp564B2062 (f 

ESTs 

advanced glycosylation end product-speci 

ESTs 

ESTs 

ESTs 

receptor (calcitonin) activity modifying 
ATP-binding cassette, sub-family A (ABC1 
solute carrier family 6 (neurotransmitte 
MAD (mothers against decapentaplegic, Dr 
similar to lysosome-associated membrane 
Target Exon 

C1 1001883*:gil6753278|ref(NP JJ33938.1 1 c 
NMJ)16582*:Homo sapiens peptide transpor 
NlvLG04079:Homo sapiens cathepsln S (CTSS 
ENSP00000235229:SEMB. 
C21000030:gi|9955960Iref|NP_063957.1lAT 
NM_031 41 9*:Homo sapiens molecule possess 
NM_007037*:Homo sapiens a disintegrin-li 
NM_005463:Homo sapiens heterogeneous nuc 
NrvL0191 1 1*:Homo sapiens major histocompa 
NM_0Q2944*:Homo sapiens v-ros avian UR2 
CD83 antigen (activated B lymphocytes, i 
C1 1001 637*:gi|5032241 |ref |NP_005732. 1 1 z 
Target Exon 
Target Exon 

major histocompatibility complex, class
hemoglobin, gamma G 
annexin A2 

major histocompatibility complex, class 
leukocyte immunoglobulin-like receptor, 
gb:Human trophoblast hypoxia-regulated f 
complement component 8, beta polypeptide 
arylacetamide deacetylase (esterase) 
ESTs 
ESTs 

forkhead box F1 
ESTs 

interleukin 12A (natural killer cell sti 
hypothetical protein FU20022 
cytochrome P450, subfamily IVB, polypept 
Homo sapiens mRNA; cDNA DKFZp564G1 12 (fr 
Homo sapiens mRNA, chromosome 1 specific 
src homology three (SH3) and cysteine ri
gb:PM3-HT0605-270200-001-a02 HT0605 Homo 
macrophage receptor with collagenous str 
gb:QV1-HT0413-010200-059-h03 HT0413 Homo 
ATP-binding cassette, sub-family A (ABC1 
ESTs 

bone morphogenetic protein 2 

cardiac ankyrin repeat protein 

CXC chemokine ligand 16

CXC chemokine ligand 16 

interleukin 8 receptor, beta 

gb:QV4-HT0222-01 11 99-01 9-e05 HT0222 Homo 

zinc finger protein, subfamily 1A, 5 (Pe 

hypothetical protein FLJ 12666 

ESTs 

ESTs, Weakly similar to S65657 alpha-1 C- 

carboxypeptidase B2 (plasma) 

ESTs, Weakly similar to 16.7Kd protein [ 

hypothetical protein FLJ20992 similar to 

ESTs 

found in inflammatory zone 3 
ESTs 

neutrophil cytosolic factor 2 (65kD, chr 
ESTs 

Homo sapiens cDNA FLJ 14237 fis, clone NT 
ESTs 

Rac/Cdc42 guanine exchange factor (GEF) 
coagulation factor VIII, procoagulant co 
leiomodin 1 (smooth muscle)
enhancer of filamentation 1 (cas-like do
hypothetical protein FLJ14902
tryptophanyl-tRNA synthetase
ESTs 



PCT/US02/12476 



059 


1 55 

1 • WW 7 


10 14 


51.00 


0 35 


1 62 

1 * W£* 


0 23 


9 45 

w • i w 


0 03 


1 71 


0 01 


1 49 

1 • • w 


0 42 


1 26 


0 46 


2 43 

Ul IW 


0 57 


1 59 

I « WW 


029 


1 80 

1 • WW 


0 32 


2 27 

bib i 


0 31 


1 51 

1 ♦ W 1 


0 55 


1 78 

1 * 9 W 


0 00 


3 02 


0 32 


249 


0 46 


1 74 


0 52 


1.87 


0 00 

v«vw 


3.30 


0 01 


2 31 


0 66 


2 20 

** i *-W 


1 00 


297 00 

i— W 1 * w w 


1 00 


109.00 

1 w w » w w 


0 89 


1 39 

1 « w w 


1 45 


447 


1 00 


1.87 


1 00 


149.00 


1 06 


2.96 


0 04 


4.89 


1 00 


225.00 


0 97 


1.93 


1 00 


68.00 


0 02 


1.83 


1 00 


235 00 

A_W w* w w 


1 00 


93.00 


1 37 


6 02 

Wi w 


0 86 


2 46 

X- > i w 


0 01 


3 19 

W* 1 w 


1 00 


147 00 

1 « ■ ■ WW 


1 03 


2.04 


1 00 


64 00 

W I » w w 


1 00 


90.00 


1 00 


67.00 

Wl • WW 


1 00 

1 (WW 


102 00 

9 VlftV W 


1 00 


70 00 

I WtWW 


1 00 


112 00 

1 I w w 


0 07 

w« w 1 


10 17 

1 W* I 1 


0 39 


2 31 

b* w | 


1 00 

J (VV 


95 00 

w w> w w 


0 01 

w* w l 


455 

* • w w 


0 01 

w • w 1 


372 


1 00 

1 ♦ WW 


79.00 


0 14 

w • J *T 


27.35 

*- 1 *ww 


1 00 

1 • w w 


113.00 


0 64 

w ■ W 1 


2.47 


0 55 

W* W W 


2.40 


1 00 

1 k W W 


111 00 

III • w w 


1 00 


95.00 

w w • w w 


1 00 

1 •WW 


87 00 

W t i w w 


1 43 


8.07 

W« W f 


0 02 


3.07 


0 93 

w • w w 


1.72 


0 97 

W ' w 1 


1.51 

1 * W 1 


0 02 


2 42 


0 65 

W« WW 


1.50 

1 < w w 


20 87 


232.00 

*— w *— ■ WW 


1 00 

1 • WW 


80.00 


1 00 

1 « w w 


85.00 


1 00 


213.00 


0 02 

Wl Wb 


3.93 


1 00 

1 • WW 


115.00 


049 


1 94 

1 • W I 


0 03 

W» WW 


3 75 

\J* 9 W 


0 86 


1 95 

1 * WW 


1 00 


120 00 

J XrV< V W 


0 60 

V» ww 


2 48 


1 00 


95 00 

w w • w w 


1 00 

1 » w w 


136 00 

1 WW* WW 


0 02 

W ■ 


8 07 

W» W 1 


1 00 


73 00 


0.70 


3.36 


0.06 


6.56 


0.70 


3.66 


1.00 


114.00 


0.85 


1.30 


0.15 


15.54 



172 



WO 02/086443 



PCT/US02/12476 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



418067 


AH 27958 

#il 1 t— I www 


Hs 83393 

1 IWtWWWWW 


cvstatin E/M 

w j w k< * v t M r in 


0.81 


1.74 


418296 


C01566 

WW iwww 


Hs 86671 

1 1 w » W W W f I 


ESTs 

l» W I w 


1.00 


99.00 


418643 

■ i w w » w 


J03798 

W WW ■ WW 


Hs 86948 


small nuclear ribonucleoDrotein D1 doIvd 

w ■ 1 » Wl 1 • • W VI W Wl » 1 WW| t W W* WW t W a\W* ■ 1 *^ ■ " J r 


1.00 


60.00 


418832 


X0401 1 


Hs 88974 

1 IW*WWWf » 


cvtochrome b-245 beta DolvDeDtide fchro 


2.40 


14.74 


418945 

1 1 WW~W 


BE246762 


Hs.89499 


arachidonate S-liooxvpenase 


0.67 


3.16 


419261 

■ ■ W C W J 


X07876 

/ \w f W f W 


Hs.89791 

■ IU • W W I W 1 


wingless-type MMTV integration site fami 


1.00 


73.00 


419564 

T 1 W W W » 


U08989 

WW WW WW 


Hs 91139 

• IW«W | >WW 


solute carrier familv 1 (neuronal/eoithe 

W W t W W WJ ill W* 1 III ■ IT * 1 1 W"*l < *l I 


1.00 


192.00 


419574 

■ I w W f I 


AK001989 

r *» VW 1 W W 


Hs.91165 


hvDothetical protein 


1.00 


94.00 


419968 


X04430 

/*W"T*T WW 


Hs 93913 

1 IWaWWw 1 W 


interleukin 6 (interferon, beta 2) 

1*1 lw 1 1 W W I » 1 1 1 W lliiWMVlwllj wwiw *— y 


61.16 


500.00 


420256 

t+m w^ W V 


U84722 


Hs.76206 


cadherin 5, type 2, VE-cadherin (vascula 


0,52 


1.70 


420285 

~*W W W W 


AA258124 


Hs.293878 


ESTs, Moderately similar to ZN91 HUMAN Z 


1.00 


172.00 


420577 


AA278436 

/ U i W~WW 


Hs 186649 

1 lv« 1 WWW iW 


ESTs 


1.00 


97.00 


421262 


AA286746 

nnLUu / *tu 


Hs 9343 

I lw i W W i w 


Homo saDi'ens cDNA FLJ 14265 fis. ctone PL 

■ 1 U | | I V_i/ W L* 4 W 1 1 W if 1 I *a»W ■ • *W W W * ■ W J V 1 W ■ ■ 


1.00 


64.00 


421445 


AA913059 

nnj i wwww 


Hs 104433 

1 IW* 1 W i I WW 


Homo sapiens, clone IMAGE:4054868, mRNA 

I | Vl 1 I W UUU|Vl lvf| W * W « 1 W 1 I W M ' ^w/ r I WW I W W W J III! " ' • » 


0.88 


1.51 


421470 


R27496 

1 >«U I TW W 


Hs.1378 

1 1 W« • W t W 


annexin A3 

Ul 1 1 IwmH 1 M » W 


0.05 


11.26 


421478 


AI683243 


Hs 97258 

I IWiWI a_W w 


ESTs Moderately similar to S29539 ribos 

L>w \ W l I • Iw W*»> I ^* *vi J »*i I I iii*^' v w xx *— w ■»» * 


1.00 


73.00 


421563 

" 1 www 


NM 006433 

1 » i v I W W w "T W W 


Hs 105806 

1 1 W • 1 wwwww 


aranulvsin 

W | k^J 1 IUII W|IP 


0.82 


2.42 


421566 

~i* IWWW 


MM 000399 

1 t 1 T I. .WWWWWW 


Hs.1395 


earlv arowth response 2 (Krox-20 (Drosop 

X« III 1 V* 11 li 1 1 *xw v vi iw%# I 1 vi w / » w \™" • w**»» r~ 


5.50 


31.57 


421 855 

c 1 WWW 


F065O4 

1 www W » 


Hs 27384 


ESTs, Moderately similar to ALU4 HUMAN A 


1.00 


129.00 


421913 

I w 1 w 


A1934365 

f\* WW « w w w 


Hs 109439 

I IW* 1 W W i W \J 


osteoalvcin (osteoinductive factor, mime 

\*j w iv w 7 y it w HI iwu \ i^/ iii w w w ■ i ' j i<ii*i iw 


1.00 


101.00 


421952 


AA300900 

# ** iwwwwww 


Hs.98849 

\ \ W « W Vrf W IW 


ESTs, Moderately similar to AF1 61 51 1 1 H 


0.60 


63.60 


422232 


D43945 


Hs.1 13274 

1 IW» 9 J WCb 1 ■ 


transcription factor EC 

11 1 1 W W 1 1 W \t W II 1 WW l>W 1 t-^ 


1.00 


148.00 


422386 

t»W WW 


AF1 05374 

1 11 I WW^WP i 


Hs. 115830 


heparan sulfate (glucosamine) 3-0-sulfot 


1.40 


3.98 


423168 


R34385 


Hs. 124940 

1 IW* 1 » w 


GTP-bindina protein 

M t 1 W 1 I IU II 'if t *vl • P 


0.34 


3.59 


423196 

~fcW 1 WW 


AK001866 

P 11 >W W 1 W V W 


Hs.1 25139 

1 iW * 1 *— W 1 WW 


hypothetical protein FU11004 


0.55 


2.00 


423387 


AJ01 2074 

nUV 1 — W 1 ■ 




vasoactive intestinal peptide receptor 1 

V Li w W UU L 1 v w 1 1 hWUU | IUI WWW VI W V WWWW % w 1 1 


0.09 


2.13 


423424 


AF1 50241 


Hs 128433 

I IW 1 1 aCWTWW 


oroslsalandin D2 synthase hematopoietic 

uiyjkoyiuiiudi >— ' wT*f»(fwwwp f iwi i iwtvi/vivuw 


too 


141.00 


423456 


AL1 10151 

nL 1 1 W • W 1 


Hs.1 28797 

1 *W • | £m\J 9 W # 


DKFZP586D0824 protein 

1 \l *— 1 W W W*W WW A* 1 Wl W IWI 1 ■ 


1.00 


66.00 


423696 

~t www w 


Z92546 




Sushi domain (SCR repeat) containinq 


0.73 


1.27 


424027 


AW337575 


Hs.201591 

i 1 J'tU IWW I 


ESTs 


0.54 


2.58 


424212 


NM 005814 

HIT! WWWW 1 1 


Hs.143131 

1 IW* | l W 1 W f 


alvcoorotein A33 (transmembrane) 

VJ | ■ %pf ^pT ppf | \ W III 1 1 1 1*1 *J^* 1 I • P ■ 1 I * ™» P P P M 


0.77 


2.47 


425087 


R62424 


Hs 126059 

1 1 W » 1 LUvVW 


ESTs 

1 w 


1.00 


74.00 


495175 

ttv I/O 


AF020202 

f\t W— w £. W — 


Hs 155001 

1 1 w« I WWW w 1 


UNCI 3 (C eleaansl-like 

VJ 1 T W 1 W 1 w^i wl W W Ul IW J 1 II VW 


0.85 


1.96 


425771 


BE561776 


Hs 159494 

1 Ivi 1 ww~w • 


Bruton aaammaolobulinemia tyrosine kinas 

wi fcp i i w*23 iii' **^-yii^* T w i w» * ii*ph J w ■ * p ■ 


1.18 


2.56 


426486 


BE1 78285 


Hs 170056 

I IW* | i wwww 


Homo sapiens mRNA; cDNA DKFZp586B0220 (f 

I I Wl 1 4 W U(JWIV< IW HH ll II ■ | W*^l ~* * 1^1 W W W W fc* w »i«v 


1.00 


76.00 


427507 

it* | W W 1 


AF240467 


Hs.179152 

1 IW* 1 1 w I V»— 


toll-like receptor 7 

LWI 1 1 1 MV 1 WWW WW 1 1 


1.00 


63.00 


427618 

f U IV 


MM 000760 

1 11 V 1 WWW* WW 


Hs.2175 

1 IW»*» | | W 


colonv stimulatina factor 3 receptor (qr 

( W I ■ ¥ VP 1,1 | 1 IM 1 W M 1 • VJ 1 W*W *j W ■ » W»'f' ■ | V| P 


0.60 


2.19 


427732 

it. I 1 W£- 


mm 002980 


Hs.2199 

1 1 W • *W 1 ww 


secretin receptor 


0.97 


1.42 


427952 

"fa ■ WW«V 


AA765368 

n/ii wwwww 


Hs.293941 


ESTs. Moderately similar to A53959 throm 


1.00 


105.00 


428709 


BE268717 


Hs. 1049 16 

1 1 W / * w * w * w 


hypothetical protein FLJ21940 


1.00 


80.00 


428769 

r W I W W 


AW207175 


Hs.1 06771 

• IW* 1 WWf ■ ■ 


ESTs 


0.09 


2.55 


428780 


AI478578 

l\| i t WWI w 


Hs.50636 

1 IW*^/WWWW 


ESTs 


1.00 


98.00 


428833 


AI928355 


Hs 185805 

| IW* 1 wwwww 


ESTs 

W W 1 w 


1.00 


113.00 


429657 


D13626 

LJ | w W— W 


Hs 2465 


KIAA0001 oene product: putative 6-protei 

1 vnnvvw i m v>* iw wiwwuwij ww**w*ki*w wiw*>wi 


1.00 


52.00 


430212 


AA469153 




gb:nc67f04.s1 NCLCGAP_Pr1 Homo sapiens 


1.00 


132.00 


430226 


BF245562 


Hs 2551 

1 lw»«WW W 1 


adrenerotc beta-2- receptor, surface 

14 W 1 ul IW| w 1 Wj W W 1 W> A. | 1 W W w w LWI | WWII Uyw 


0.11 


15.60 


430376 


AW292053 

ni? Aw— www 


Hs 12532 

1 1 W« | «UWW— 


chromosome 1 ooen readino frame 21 

Wl ii wi I iwwwi iiw i wwwii i www ii ly iiwiiiw *wi 


1.00 


103.00 


430414 


AW365665 

♦ \ ¥ 1 www www 


Hs 120388 

1 lw« | «t_ W w W W 


ESTs 

WW 1 w 


0.50 


6.96 


430656 

r W W WW W 


AA482900 


Hs 162080 


ESTs 


1.00 


70.00 


430843 

"v WW » W 


AI734149 

til f W*T 1 ■ W 


Hs 119514 

1 IW* | 1 WW * > 


ESTs 

InW 1 W 


1.00 


90.00 


430998 

"WWW WW 


AF1 28847 

#ll 1 pww w~ i 


Hs 204038 

1 IW«akaW~VWW 


indolethvlamine N-methvltransferase 

1 t IVI W I W IIIJI P*rf*l III* |W it II ■ W 11 1 I HI P— • ■ IWI P *^w w 


0.29 


1.84 


431217 

~W 1 «— 1 J 


mm 013427 


Hs 250830 

1 IW*a^WwWWV 


Rho GTPase activatino protein 6 


1.00 


79.00 


431921 

"Tw I w*» 1 


N46466 

1 1™ w • w w 


Hs 58879 

1 IWaWWWl W 


ESTs 

l— 1 W 


0.91 


1.67 


432176 


AW090386 


Hs 112278 

1 1 W , 1 > flk^JW 1 w 


arrestin. beta 1 


0.66 


2.63 


432203 

~w £.*UW W 


AA305746 


Hs.49 


macrophaoe scavenqer receptor 1 


1.00 


76.00 


432231 


AA339977 

nnvw w w i i 


Hs 274127 

1 IWtlh 1 ~ 1 *■ ■ 


CLST 11240 protein 

wUV 1 II P— • W Wl W^WM I 


0.46 


1.46 


432485 


N90866 

( VW WwWW 


Hs 276770 

f *Wfl_# W f # W 


CDW52 antiqen (CAMPATH-1 antiqen) 

\*SL^ m W w 4-m WJ » 1 "13 W^p » I ll Iff * 1 f • l p **• JJ » * 


0.79 


2,25 


432522 


D11466 


Hs 51 

1 IW»W 1 


nhosDhatidvlinosital olvcan class A (oa 

UilUUUIILiUUIIM IWwl WJ 1 MIIUUII) WIWJWW P 1 ^ f-* 


1.93 


4.83 


432596 


A 1224741 


Hs 278461 


matrilin 3 

1 1 IQll II II 1 W 


0.04 


5.79 


432850 


X87723 

/AW r I C, W 


Hs 3110 

1 IW i W 1 I w 


anaiolenstn recsoior 2 

VJI ImI W w 1 1 W II 1 1 WWW Ulvl *» 


1.00 


167.00 


433138 

*TWW 1 uU 


AB029496 


Hs 59729 

1 |w*W W 1 *_ w 


semaDhorin sem2 

WWl 1 IWMI IWI III WWII lb 


0.04 


9.16 


433563 


A1732637 


Hs 277901 

1 \\J • i— t 1 WW 1 


ESTs 

L_ v 1 W 


1.00 


91.00 


433588 


AI056872 


Hs 133386 

1 1 W » 1 wwwww 


ESTs 


120.16 


315.00 


434445 


A1349306 


Hs 11782 

1 Jw« 1 1 t W*w 


ESTs 


0.60 


1.84 


435496 


AW840171 


Hs 265398 

1 IwvtCWWWWW 


ESTs Weaklv similar to transformation-r 

1^ W 1 V) wVwvll\ljr W|l| IIIUI IW UUIIWIvl II Iblllvll P 


1.00 


128.00 


435974 


U29690 

U— WW WW 


Hs 37744 

1 1 W* W I r "T~ 


Homo sapiens beta-1 adreneroic receptor 

I IWI 1 IW WWWIWIIW VUIU 1 UMIVIlWiyiV IWWW^»*wi 


1.00 


108.00 


436061 


Al 248 584 


Hs 190745 

1 1 w , | WW i * W 


Homo saDiens cDNA: FLJ21326 fis. clone C 

| | W III W wQUlWllw W *w 111 ti 1 p—w 1 W W iPW|Wiwiiw 


1.00 


91.00 


437157 

~W t 1 w r 


BE048860 

l—f La W I WwWW 


Hs 120655 

1 1 W « 1 aWWWWW 


ESTs 

l^pp^p* I w 


1.00 


87.00 


437207 

" W r -Cw 1 


T27503 

1 £m f WWW 


Hs 15929 

1 1 W • 1 WW*— w 


hypothetical protein FLJ12910 

I If WWW 1 W VI WWI Wl W LWl 1 1 I ha»V 1 «ba W 1 W 


1.00 


105.00 


43731 1 

» W (Oil 


AA370041 

n/*w i ww I i 


Hs 9456 

1 IW*W >ww 


SWI/SNF related, matrix associated, acti 

Vpr W W 49 Vpf 1 II 1 \^I«H* »W VP 1 1 P 1 tn*J**l I* » W W W t *>W Wf »» 


1.00 


71.00 


437439 

"w r *f ww 


H29796 

1 *£+ W f WW 


Hs 269622 

1 1 W t — W W Wflb *b 


ESTs 

pWb W f W 


1.00 


115.00 


438199 

"OU 1 WW 


AW0 16531 

r\f ¥ W 1 WWW J 


Hs 122147 

1 itfi 1 fab l~r 


ESTs 

IvV i w 


1.00 


80.00 


439551 

i w w w w i 


W72062 


Hs 11112 

1 1 W« 1 1 1 l 


ESTs 

|_*W P w 


0.30 


3,10 


440515 

Ttwv 1 w 


AJ131245 

Ov 1 W 1 ■£» » W 


Hs 7239 

1 IW • * LU w 


SEC24 IS cerevls'iae) related aene famil 

V* I— V»/ »^ Tt W* WWI V» T IWIU w I 1 wiwiw W M wi 1 w 1 wi 1 ill 


1.00 


77.00 


440887 


AI799488 


Hs 135905 

1 IWi 1 wwwww 


ESTs 

Uv • w 


1.00 


85.00 


441025 


AA913880 

#u» w I WW WW 


Hs 176379 

1 1 W • 1 i WW | w 


ESTs 


1.00 


82.00 


441384 

• i i ww™ 


AA447849 


Hs.288660 

* IWlAWWWWWW 


Homo sapiens cDNA: FLJ22182 fis, clone H 

I IVI ■ I** W*^PP> IWI 1 W WW 1 If *l • P^W *W 9 ^P*"* P IW J ^* • | 


0.79 


1.89 


441735 

Tt 1 f ww 


A1738675 

/»! 1 WWW* W 


Hs 127346 

■ lv» 1 W~W 


ESTs 

1— V-* 1 w 


1.00 


75.00 


442200 


AW590572 

|~i»»wWWW| c 


Hs 235768 

1 IW*— ww* WW 


ESTs 

1 — > v> 1 w 


0.78 


5.83 


442832 


AW206560 


Hs.253569 


ESTs 


0.03 


10.88 


442957 


A1949952 


Hs.49397 


ESTs 


1.00 


70.00 


443282 


T47764 


Hs.132917 


ESTs 


1.00 


197.00 


443547 


AW271273 


Hs.23767 


hypothetical protein FLJ12666 


1.00 


253.00 


443951 


F13272 


Hs.111334 


ferritin, light polypeptide 


0.55 


2.09 


444330 


AI597655 


Hs.49265 


ESTs 


1.00 


90.00 
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A A Mr- A r- 

444515 


i i * >a* a Ann 

AW204908 


Hs.1 69979 


ESTs 


1.0U 


qa nn 
04.UU 


445769 


AI741471 


Hs.23666 


ESTs 


0.02 


A OO 

4.3a 


445908 


R13580 


Hs.13436 


Homo sapiens clone 24425 mRNA sequence 


a rsr\ 

1.00 


m nn 
97.UU 


446291 


BE397753 


ii a a a n n 

Hs. 14623 


interferon, gamma-inducible protein 30 


A no 

0.93 


A en 
1.69 


446917 


AI347863 


i 9 A AAA*TA 

Hs.1 56672 


ESTs 


■f Art 

1.00 


4nc nn 
IUd.OU 


447261 


NM_006691 


Hs.17917 


extracellular link domain-containing 1 


A An 
U.4U 


At OA 


447432 


AW958473 


ll A n a n 

Hs.301957 


nudix (nucleoside diphosphate linked moi 


1.00 


inn nn 
1UU.UU 


447482 


AB033059 


Hs. 18705 


KIAA1233 protein 


A AC 
U.05 


o.^l 


447997 


H00656 


1 1 nA^A a 

Hs. 29792 


ESTs, Weakly similar to 138022 hypotheti 


A AO 


C AO 


448299 


A A J A*TA J J 

AA497044 


Hs.20887 


hypothetical protein FU 10392 


"1 AA 
1.00 


7q nn 
/y.UU 


448782 


AL050295 


Hs.22039 


KIAAQ758 protein 




1 .00 


A. r— f\ r* ^ 

450575 


NM_005859 


1 1_ on* <<"7 

Hs.29117 


punne-ncn element binding protein A 


U.l/ 


n.j»3 


450584 


a A r\ a A inn 

AA040403 


Hs.60371 


ESTs 


1 Af\ 


nn 

o4.UU 


450693 


a i a i j r A a r> A 

AW450461 


Hs.203965 


ESTs 


l.UU 


01 nn 
yi .uu 


450715 


Al 266484 


1 1 — oh nA 

Hs.31570 


ESTs, Weakly similar to KlAAlo^4 protein 


1 AA 


1 CO AA 

I oz.uu 


451103 


R52804 


Hs.25956 


DKFZP564D206 protein 


4 nn 
l.UU 


nn 
ob. UU 


451220 


A r - a a A A r- A 

AF1 24251 


l l nnnr* J 

Hs.26054 


novel SH2-contammg protein 3 


A cn 
U.bU 


1 ^A 

l.oU 


451668 


Z43948 


Hs.326444 


cartilage acidic protein 1 


A C>l 

U.54 


i.yi 


452197 


AW023595 


Hs,232048 


ESTs 


1.00 


C7 nn 
D/.UU 


452331 


M598509 


Hs.29117 


purine-rich element binding protein A 


A CO 

4.53 


1 1 n7 

n.u/ 


452353 


C18825 


Hs.29191 


epithelial membrane protein 2 


0.72 


o o/ 
2.24 


453049 


BE537217 


II n a a A n 

Hs.30343 


r— n,"H" 

ESTs 


i An 
1,00 


cq nn 
bo.UU 


453107 


1 ri 1 A A A A A A 

NM_016113 


Hs.279746 


vanilloid receptor-like protein 1 


A Q9. 


1 7A 

l.fU 


453355 


III t r> r\ i— r\ —y A 

AW295374 


11— A J Jil A 

Hs.31412 


Homo sapiens cDNA FLJ11422 fis, clone Ht 


i nn 
l.UU 


iqo nn 
lo^.uu 


453390 


A */-«,/-> j-* AAA 

AA862496 


1 I nn Ann 

Hs.28482 


ESTs 


4 nn 
l.UU 


70 AA 
f Z.UU 


4WW J 






CQT- \AJoaUw dmllar tn 10^70^ mPP nrnt 


1 on 


68 00 


454741 


BE1 54396 




gb:CM2-HT0342-091299-050-b05 HT0342 Homo 


0.57 


2.89 


456579 


AA287827 


Hs.284205 


up-regulated by BCG-CWS 


1.00 


82.00 


456672 


AK002016 


Hs. 114727 


Homo sapiens, clone MGC: 16327, mRNA, com 


0.79 


1.96 


457400 


AF032906 


Hs.252549 


cathepsin Z 


1.03 


3.25 


457718 


F18572 


Hs.22978 


ESTs, Weakly similar to ALU4_HUMAN ALU S 


1.00 


113.00 


459696 


F03027 




gb:HSC1KA072 normalized infant brain cDN 


1.00 


544.00 



TABLE 10B

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey 
408074 

411667 
413533 



423696 

430212 
436532 
453531 
454741 



CAT Number 
103684J 

1253334J 
1375344J 



423387 22779J 



231 12J 

314437 1 
421802.1 
97026J 
1 232559 J 



Accession 

R20723 AA263003 AA333976 M334725 M334151 AW965490 M310513 AI810530 D31302 AW134897 AA830127 AA046953 AI668930 
C06094AW1 04534 

BE160198 AW935898 T11520 AW935930 AW856073 AW861034 

BE146973 BE146972 BE147042 BE147018 BE146783 BE147020 BE146781 BE147019 BE146766 BE147021 BE146952 BE146767 BE147044 
BE146797 BE146776 BE146985 BE146793 BE146768 BE146771 BE146954 BE146760 BE147048 BE147025 BE147030 
AJ012074 U11087 L13288 X75299 L20295 AW630780 H14880 T28037 A1872991 R72136 AW449839 T81622 T79697 T29519 R94105 T83923 
R73300 AI797007 R73390 AA961010 H74168 A1689932 BE045543 AI808418 AI608912 AI806573 AW884084 AW872978 AW872985 AA565655 
AI022915 R50647 R73210 H45098 R46451 AW166269 T71 132 AI264547 R52146 AI304920 R73391 AW884059 AW884085 H73241 T60038 
T79612 R731 45 R50549 AI094557 AI668793 R72302 AI564366 W01 956 M41 8962 W32571 R72840 H45409 R72085 R46356 R46758 
AA508805 AA418798 T83751 R94072T16182AA928785 AA903896 

Z92546 AA330586 AI570568 AW341487 AI827050 AW298668 AI792189 AI015693 AI733599 AI572251 AI672488 AW1 93262 A1244716 

AI864375 AI206100 AA91 2444 AI269365 AI640254 AW772466 AI867336 AA627604 H1 6914 AA358477 M338009 

M4691 53 AI71 8503 M469225 

AA721522 AW975443 T93070 

AA417940M036735T07025 

BE154396 AW817959 BE154393 



TABLE 10C 



Pkey:
Ref: 

Strand: 



Unique number corresponding to an Eos probeset 

Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA
sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495. 
Indicates DNA strand from which exons were predicted. 



NLposition: Indicates nucleotide positions of predicted exons. 

Pkey Ref Strand NLposition 

400754 7331445 Plus 144559-144684 

401045 8117619 Plus 90044-90184,91111-91345 

401083 3242744 Plus 33192-33360 

402474 7547175 Minus 53526-53628,55755-55920,57530-57757 

402808 6456148 Minus 114964-115136,115461-115585,115931-116047,117666-117771,118004-118102 

403021 7547270 Plus 120799-120966 

403421 9665041 Minus 126609-126773,139986-140205 

403438 9719679 Plus 90792-90938 

403687 7387384 Plus 9009-9534 

403764 7717105 Minus 118692-118853 

404277 1834458 Minus 91665-91946 

404288 2769644 Plus 3512-3691 

404394 3135305 Minus 37121-37205,37491-37762,4105341140,41322-41593,41773-41919 

404518 8151988 Plus 84494-84603 

404916 7341826 Plus 91057-91188 

405106 8079395 Minus 80877-81418 

405257 7329310 Plus 73121-73273 

405381 6006920 Minus 7636-8054 
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WO 02/086443 

406387 9256180 Plus 



116229-116371,117512-117651 



PCT/US02/12476 



175 



WO 02/086443 

TABLE 11 A: Genes Distinguishing Adenocarcinoma from Other Lung Diseases and Normal Lung 



PCT/US02/12476 



Table 11A shows about 84 genes upregulated in lung adenocarcinomas relative to other lung tumors, non-malignant lung disease, and normal lung. These genes were selected 
from about 59680 probesets on the Eos/Affymetrix Hu03 Genechip array.

Table 11B shows the accession numbers for those Pkey's lacking UnigeneID's for table 11A. For each probeset we have listed the gene cluster number from which the
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the
"Accession" column.

Table 11C shows the genomic positioning for those Pkey's lacking Unigene ID's and accession numbers in table 11A. For each predicted exon, we have listed the genomic
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 



Pkey: 
ExAccn: 
UnigeneID:
Unigene Title: 
R1: 

R2: 



Unique Eos probeset identifier number 

Exemplar Accession number, Genbank accession number 

Unigene number 

Unigene gene title 

Average of lung tumors (including squamous cell carcinomas, adenocarcinomas, small cell carcinomas, granulomatous and carcinoid tumors) divided by the 
average of normal lung samples 

Average of non-malignant lung disease samples (including bronchitis, emphysema, fibrosis, atelectasis, asthma) divided by the average of normal lung samples 



Pkey


ExAccn


UnigeneID


Unigene Title

If* ™» V 1 \r 9 9 %9 


R1 


R2 


403329 






Target Exon 


1.00 


61.00 


406399 






NM_003122*:Homo sapiens serine protease 


1.00 


39.00 


406690 


M29540 


Hs.220529 


carcinoembryonic antigen-related cell ad 


226.37 


350.00 


4Q7869 


A1827976 


Hs.24391 


hypothetical protein FLJ13612 


0.77 


1.18 


407881 


AW072003 


Hs.40968 


heparan sulfate (glucosamine) 3-O-suIfot 


1.00 


10.00 


408908 


BE296227 


Hs.250822 


serine/threonine kinase 15 


7.76 


1.00 


409103 

T \y v 9 \* v- 


AF251237 


Hs. 112208 


XAGE-1 protein 


80.44 


40.00 


409187 


AF154830 

9 11 * 1 Vr 


Hs.50966 


carbamoyl-phosphate synthetase 1, mitoch 


1.00 


1.00 


409269 

* W W V V* 


AA576953 


Hs.22972 


hypothetical protein FLJ13352 


1.00 


1.00 


410076 


T05387 


Hs.7991 


ESTs 


1.12 


1.50 


410102 


AW248508 


Hs.279727 


Homo sapiens cDNA FLJ 14035 fis, clone HE 


9.89 


1.00 


410399 


BE068889 




synuclein, gamma (breast cancer-specific 


0.92 


1.06 


411908 


L27943 


Hs.72924 


cytidine deaminase 


1.00 


1.00 


412612 


NM 000047 


Hs.74131 


arylsulfatase E (chondrodysplasia puncta 


1.02 


1.03 


414075 


U11862 


Hs.75741 


amiloride binding protein 1 (amine oxida 


0.84 


1.07 


416208 


AW291168 


Hs.41295 


ESTs, Weakly similar to MUC2_HUMAN MUCIN 


3.67 


1.00 


417542 


J04129 


Hs.82269 


progestagen-associated endometrial prate 


1.28 


1.35 


419183 


U60669 


Hs.89663 


cytochrome P450, subfamily XXtV (vitamin 


1.00 


1.00 


419502 


AU076704 




fibrinogen, A alpha polypeptide 


13.05 


115.00 


419631 


AW188117 


Hs.303154 


popeye protein 3 


1.00 


13.00 


420931 


AF044197 


Hs.100431 

9 9SJ 9 9 1 w • 


small inducible cytokine B subfamily (Cy 


1.00 


8.00 


421155 


H87879 


Hs. 102267 


Ivsvl oxidase 


1.00 


15.00 


421190 


U95031 

w vf V W • 


Hs. 102482 


mucin 5, subtype B, tracheobronchial 


1.17 


1.55 


421474 

J I— | l^ * T 


U76362 


Hs. 104637 


solute carrier family 1 (glutamate trans 


1.46 


1.76 


421515 


Y11339 


Hs. 105352 


GalNAc alpha-2, 6-sialyl transferase ), ) 


1.00 


3.00 


421582 


A19 10275 




trefoil factor 1 (breast cancer, estroqe 


1.23 


1.00 


422026 


U80736 


Hs.1 10826 


trinucleotide repeat containino 9 


1.00 


52.00 


422095 


AI868872 


Hs.282804 


hypothetical protein FLJ22704 


4.37 


2.34 


42231 1 


AF073515 


Hs.1 14948 


cytokine receptor-like factor 1 


1.15 


1.78 


422867 


L32137 


Hs.1 584 


cartilaqe oliaomeric matrix protein (pse 


1.69 


3.17 


423472 


AF041260 

• 1# V* 1 W Ma V w 


Hs. 129057 


breast carcinoma amplified sequence 1 


48.13 


72.00 


423554 


M90516 


Hs.1 674 


Qlutamlne-fructose-6-DhoSDhate transamin 


1.00 


50.00 


424502 


AF242388 

1 11 1 w 


Hs.1 49585 


lengsin 


1.00 


1.00 


424544 


M88700 


Hs.1 50403 


dopa decarboxylase (aromatic L-amino aci 


1.00 


59.00 


424905 


NM 002497 

1 1 111 VSWa^ ' w * 


Hs. 153704 


NIMA (never in mitosis gene a)-related k 


21.35 


1.00 


424960 


BE245380 


Hs.153952 


5' nucleotidase (CD73) 


1.00 


1,00 


425523 


AB007948 


Hs.158244 


KIAA0479 protein 


1,00 


35.00 


426230 


AA367019 


Hs.241395 


protease, serine, 1 (trypsin 1) 


1.00 


83.00 


427701 


AA411101 


Hs.243886 


nuclear autoantigenic sperm protein (his 


7.41 


34.00 


428585 


AB007863 


Hs.185140 


KIAA0403 protein 


1.00 


6.00 


428758 


AA433988 


Hs.98502 


hypothetical protein FLJ 14303 


1.06 


1.13 


429170 


NM 001394 


Hs.2359 


dual specificity phosphatase 4 


16.18 


105.00 


429263 


AA019004 


Hs.198396 


ATP-binding cassette, sub-family A (ABC1 


1.07 


1.00 


429610 


AB024937 


Hs.211092 


LUNX protein; PLUNC (palate lung and nas 


1.59 


1.69 


430508 


AI015435 


Hs.104637 


ESTs 


4.75 


7.27 


430985 


AA490232 


Hs.27323 


ESTs, Weakly similar to I78885 serine/th 


0.94 


1.28 


431548 


A1834273 


Hs.9711 


novel protein 


5.66 


15.00 


431566 


AF176012 


Hs.260720 


J domain containing protein 1 


49.76 


37.00 


431986 


AA536130 


Hs.1 4901 8 


Novel human gene mapping to chomosome 20 


1.19 


1.47 


432375 


BE536069 


Hs,2962 


S100 calcium-binding protein P 


1.65 


1.06 


432677 


NM_004482 


Hs.278611 


UDP-N-acetyl-alpha-D-galactosamine:polyp 


1.00 


48,00 


433556 


W56321 


Hs.1 11460 


calcium/calmodulin-dependent protein kin 


1.00 


19.00 


433819 


AW511097 


Hs.1 12765 


ESTs 


3.71 


8.00 


434001 


AW950905 


Hs.3697 


serine (or cysteine) proteinase inhibito 


29.31 


72.00 


434424 


A1811202 


Hs.325335 


Homo sapiens cDNA: FLJ23523 fis, clone L 


1.00 


64.00 


434792 


AA649253 


Hs. 132458 


ESTs 


8.52 


44.00 


436217 


T53925 


Hs.107 


fibrinogen-iike 1 


57.97 


31.00 


436749 


AA584890 


Hs.5302 


lectin, galactoside-binding, soluble, 4 


1.10 


1.41 


436972 


AA284679 


Hs.25640 


claudin 3 


1.59 


1.46 


437866 


AA156781 




metallothionein 1E (functional) 


3.62 


101.00 


437935 


AW939591 


Hs.5940 


mucin 13, epithelial transmembrane 


1.60 


1.39 


438915 


AA280174 


Hs.285681 


Williams-Beuren syndrome chromosome regi 


1.00 


1.00 


439451 


AF086270 


Hs.278554 


heterochromatin-like protein 1 


23.28 


52.00 
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439759 


AL359Q55 


Hs. 67709 


Homo sapiens mRNA full length insert cdn 


A nn 
I.UU 


ii nn 
Zl.UU 


441031 


An 10684 


Hs.7645 


fibrinogen, B beta polypeptide 


A MA 

1.41 


do nn 

yy.uv 


441377 


BE218239 


Hs.202656 


ESTs 


22.03 


A nn 

1.00 


443614 


AV655386 


Hs.7645 


fibrinogen, B beta polypeptide 


i nn 

1.00 


•I c nn 

16.00 


443813 


AA876372 


Hs.93961 


Homo sapiens mRNA; cDNA DKFZpo67D095 (fr 


a in 
1.ZU 


A on 

i.yy 


443991 


NM_002250 


Hs.10082 


potassium intermediate/small conductance 


5.71 


6.87 


444670 


H58373 


Hs.332938 


hypothetical protein MGC5370 


1.98 


oo. 0U 


444931 


AV652066 


Hs.75113 


general transcription factor IHA 


4 AA 

1.00 


ca nn 

54.00 


446102 


AW168067 


Hs. 3 17694 


ESTs 


a rsf\ 

1.00 


A nn 

1.00 


446163 


AA026880 


Hs.25252 


Homo sapiens cDNA FU 13603 fis, clone PL 


a nn 

1.00 


■ae nn 
ob.UU 


A A i r*n 

446469 


BE094848 


Hs.15113 


homogentisate 1,2-dioxygenase {homogenti 


a nn 


I < on 

I I .UU 


447388 


itl /aaapo J 

AW630534 


Hs.76277 


Homo sapiens, clone MGC.9381, mRNA, comp 


1.24 


A AH 


447532 


AKQ0Q614 


Hs. 18791 


hypothetical protein FLJ^ObUY 




i.bo 


44oi4d 


AXM'iCmiA 

AWoby/ / I 


Li _ encin 
HS.o^b^U 


integnn, beta o 


-1 C QA 

10.04 


1 nn 

I .UU 


J J nn A A 

448844 


AI581519 


II _ 4-7-74CJ 

Hs. 1771 64 


ESTs 


a nn 
l.UU 


ol .UU 


449444 


AW818436 


Hs.23590 


solute carrier family 16 (monocarboxylic 


1.00 


83.00 


451807 


W52854 




hypothetical protein FLJ23293 similar to 


1.55 


35.00 


452689 


F33868 


Hs.284176 


transferrin 


1.54 


1.44 


453392 


U23752 


Hs.32964 


SRY (sex determining region Y)-box 1 1 


• 1.00 


16.00 


453464 


A188491 1 


Hs.32989 


receptor (calcitonin) activity modifying 


1.55 


2.45 


453735 


AI066629 


Hs.125073 


ESTs 


1.01 


1.30 



TABLE 11B 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 

Pkey CAT Number Accession 

410399 11995 1 BE068889 BE068882 AF044311 AF017256 NM_003Q87 AF037207 AF010126 AA633976 AA872836 BE298825 BE299889 A1016464 AI684600 

A1936527 AA804675 AA394097 AI139933 AA946606 BE171313 AA722407 AA293803 AI468480 M056035 AA055968 AW796957 AI637713 
AA41 0737 H49348 AA486472 AA41 1 094 AA235594 AA402624 AA443638 AW452137 AA421 708 AW26521 1 AI493266 AA3651 32 AW966044 

419502 18535J AU076704 T74854 T74860 T72098 T73265 T73873 T69180 T74658 T58786 T60385 T73410 T68781 T67845 T67593 T73952 T67864 T60630 

T68367 T68401 T53959 T72360 T72099 T60377 T58961 T7171 2 T72821 T64738 T74645 T72037 T68688 T72063 T73258 T72826 T64242 
T68220 T74673 T71800 T68355 T61227 T62738 T69317 T53850 T64692 T73768 T73962 T73382 T68914 T70975 T73400 T60631 T73277 
T73203 T70498 T61409 T58925 NM_000508 M64982 T68301 T73729 T69445 T60424 T67922 T67736 T68716 T67755 T74765 T73819 T58719 
T74756 T60477 T74863 T61 109 T68329 T58850 T71857 T73425 T53736 T68607 T58898 T64309 T72031 T72079 T64305 T71908 T681 07 
T71916 T73787 T56035 T64425 T71870 T60476 T61376T67820 T71895 T41006 T69441 T68170 T74617 T71958 T69440 T61875 R06796 
H48353 T71914 T53939 T641 21 AA693996 T72525 T67779 T68078 AA01 1465 AA345378 AV654847 AV654272 AV656001 AI064740 T82897 
N33594 M344542 AW805054 AI207457 T61743 AA026737 H94389 AA382695 AA918409 T68044 S82092 T39959 AI017721 M312395 
AA312919 T40156 H66239 AV652989 H38728 R98521 AV655200 R95790 W03250 W00913 AA344136 AV660126 R97923 AA343596 
AW470774 AV651256 N54417AA8 12862 AW1 82929 All 11 192 H61463 H72060 AA344503 H38639 AI277511 AV661108 AI207625 T47810 
AA235252 T27853 T47778 R95746 H70620 M701463 AW827166 R98475 C20925 AV657287 T71959 T71313 T73920 T73333 T61618 T69293 
T69283 T73931 T721 78 T72456 AV645639 AV653476 T72957 T72300 T58906 T71457 T70494 T72956 T70495 T68267 T74407 T85778 
AA344726 T27854 T74485 T74101 T73868 T71518 T72304 AA343853 T73909 T68070 T72065 H72149 T73493 T73495 AV645993 R02293 
T70475 T64751 AA344441 AA343657 AA345732 AA344328 AI1 10639 AA344603 AF06351 3 T64696 T68516 T72223 T60507 T67633 R29500 
T72517 R02292 T60599 T69206 T70452 T74677 R29366 T61 277 T74914 T60352 R29675 T74843 AV645792 AA344408 T691 97 T72057 
T69368 T69358 T68258 AV650429 T73341 T61702 T74598 T40095 K02272 T40106 AA343045 AA341908 AA341907 AA342807 AA341964 
T53747 T72042 T62764 AI064899 AA343060 T67832 T72440 T71770 T68091 T69108 T72449 T69167 T71289 T68251 AV654844 T64375 
AA345234 T67598 M01 1 414 T68036 H48262 AI207557 T6821 9 W86031 T69081 T64232 R931 96 T62136 AV650539 H67459 T72978 
AA344583T60362H58121 T95711 T72803T68055T71715 R29036T72793 T69122T64595T62888T69139T68291 T64652 T67971 T46862 
AA693592 AI248502 R29454 T64764 T57001 T73052 T71429 T51 1 76 T58866 AV655414 H90426 AA342489 T73666 T67848 T72512 T53835 
T67837 T73317 T74273 T69420 T68245 T74380 T67862 T74474 T56068 

421582 2041 1 AI910275 X00474 X52003 X05030 NM 003225 AA314326 AA308400 AA506787 AA314825 A1571948 AA507595 AA614579 AA587613 R83818 

AA568312AA614409AA307578AI925552AW950155A1910083M12075 BE074052 AW004668 AA578674 M582084 BE074053 BE074126 
BE074140 AA514776 AA588034 BE074051 BE074068 AW009769 AW050690 AA858276 R55389 AI001051 AW050700 AW750216 AA614539 
BE074045 AI307407 AW602303 BE073575 A1202532 AA524242 AI970839 AI909751 BE076078 AI909749 R55292 

437866 44433 2 AA156781 AW293839 U52054 AA024963 AA778446 BE073977 AW444904 AW602574 BE164040 BE164012 BE163972 BE163974 BE163992 

AA837481 AW468444 BE185091 AW468002 AA687333 AA81 1830 AA581806 AI866686 AI572124 M043777 AA040926 D20160 AI536733 
AA812489 AW874142 AI471883 W84421 AA156850 

451807 8865J W52854 AL1 17600 BE208116 BE208432 BE206239 BE082291 AW953423 AA351619 BE180648 B E1 40560 W60080 AA865478 N90291 

AW450652 AW449519 AA993634 AI806539 AA351618 AW449522 A1827626 AA904788 AA380381 M886045 AA774409 BE003229 Z41756 



TABLE 11C 

> 

Pkey: Unique number corresponding to an Eos probeset 

Ref: Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA

sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495. 
Strand: Indicates DNA strand from which exons were predicted. 
NLposition: Indicates nucleotide positions of predicted exons. 



Pkey 

403329 

406399 



Ref 

8516120 
9256288 



Strand 

Plus 

Minus 



NLposition 

96450-96598 

63448-63554 
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TABLE 12A: Genes Distinguishing Squamous Cell Carcinoma from Other Lung Diseases and Normal Lung 

Table 12A shows about 72 genes upregulated in squamous cell carcinomas of the lung relative to other lung tumors, non-malignant lung disease, and normal lung. These genes 
were selected from about 59680 probesets on the Eos/Affymetrix Hu03 Genechip array. 

Table 12B shows the accession numbers for those Pkey's lacking UnigeneID's for table 12A. For each probeset we have listed the gene cluster number from which the
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Table 12C show the genomic positioning for those Pkey's lacking Unigene ID's and accession numbers in table 12A. For each predicted exon, we have listed the genomic 
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 



Pkey: 
ExAccn: 
UnigeneID: 
Unigene Title: 
R1: 

R2: 



Unique Eos probeset identifier number 

Exemplar Accession number, Genbank accession number 

Unigene number 

Unigene gene title 

Average of lung tumors (including squamous cell carcinomas, adenocarcinomas, small cell carcinomas, granulomatous and carcinoid tumors) divided by the 
average of normal lung samples 

Average of non-malignant lung disease samples (including bronchitis, emphysema, fibrosis, atelectasis, asthma) divided by the average of normal lung samples 



Pkey 


ExAccn 


UnigeneID 


Unigene Title 


R1 


R2 


400289 


X07820 


Hs.2258 


matrix metalloproteinase 10 (stromelysin 


132.45 


4.00 


400666 






NM_002425:Homo sapiens matrix metallopro 


3.26 


3.22 


401780 






NM_005557*:Homo sapiens keratin 16 (foca 


26.47 


10.50 


401781 






Target Exon 


10.33 


4.61 


401785 






NM_002275*:Homo sapiens keratin 15 (KRT1 


A i A 

4.13 


2.70 


401994 






Target Exon 


61.84 


47.00 


402075 






ENSP00000251056*:Plasma membrane calcium 


1.00 


1.00 


404996 






Target Exon 


1.00 


1.00 


407839 


AA045144 


Hs.161566 


ESTs 


173.91 


108.00 


408000 


L11690 


Hs.620 


bullous pemphigoid antigen 1 (230/240kD) 


151.17 


8.00 


408522 


AI541214 


Hs.46320 


Small proline-rich protein SPRK [human, 


1.98 


1.24 


410561 


BE540255 


Hs.6994 


Homo sapiens cDNA: FLJ22044 fis, clone H 


10.04 


A Aa 

1.00 


415091 


AL044872 


Hs.77910 


3-hydroxy-3-methylglutaryl-Coenzyme A sy 


1.00 


30.00 


415817 


U88967 


Hs.78867 


protein tyrosine phosphatase, receptor-t 


24.30 


1.00 


416658 


U03272 


Hs.79432 


fibrillin 2 (congenital contractural ara 


53.29 


51.00 


417034 


NM_006183 


Hs.80962 


neurotensin 


1.00 


1.00 


417366 


BE185289 


Hs.1076 


small proline-rich protein 1B (cornifin) 


8.97 


3.27 


418663 


AK001100 


Hs.41690 


desmocollin 3 


112.17 


19.00 


418678 


NM_001327 


Hs.87225 


cancer/testis antigen 


1.18 


1.10 


419121 


AA374372 


Hs.89626 


parathyroid hormone-like hormone 


1.00 


1.00 


420783 


AI659838 


Hs.99923 


lectin, galactoside-binding, soluble, 7 


3.04 


1.25 


421773 


W69233 


Hs.112457 


ESTs 


1.12 


1.14 


421948 


L42583 


Hs.334309 


keratin 6A 


51.83 


20.25 


421978 


AJ243662 


Hs.110196 


NICE-1 protein 


1.01 


0.91 


422158 


L10343 


Hs.112341 


protease inhibitor 3, skin-derived (SKAL 


2.37 


1.10 


422440 


NM_004812 


Hs.116724 


aldo-keto reductase family 1, member B10 


47.53 


32.00 


423634 


AW959908 


Hs.1690 


heparin-binding growth factor binding pr 


76.02 


1.00 


423725 


AJ403108 


Hs.132127 


hypothetical protein LOC57822 


4.20 


1.00 


423738 


AB002134 


Hs.132195 


airway trypsin-like protease 


10.14 


51.00 


424012 


AW368377 


Hs.137569 


tumor protein 63 kDa with strong homolog 


233.42 


68.00 


424046 


AF027866 


Hs.138202 


serine (or cysteine) proteinase inhibito 


1.00 


1.00 


424098 


AF077374 


Hs.139322 


small proline-rich protein 3 


137.82 


mm M jm. » 

54.00 


424834 


AK001432 


Hs.153408 


Homo sapiens cDNA FLJ10570 fis, clone NT 


56.19 


12.00 


425650 


NM_001944 


Hs.1925 


desmoglein 3 (pemphigus vulgaris antigen 


33.45 


1.00 


427099 


AB032953 


Hs.173560 


odd Oz/ten-m homolog 2 (Drosophila, mous 


4.24 


17.00 


427335 


AA448542 


Hs.251677 


G antigen 7B 


51.83 


4.00 


428182 


BE386042 


Hs.293317 


ESTs, Weakly similar to GGC1_HUMAN G ANT 


1.00 


1.00 


428645 


AA431400 


Hs.98729 


ESTs, Weakly similar to 2017205A dihydro 


1.00 


16.00 


428748 


AW593206 


Hs.98785 


Ksp37 protein 


1.00 


87.00 


429259 


AA420450 


Hs.292911 


ESTs, Highly similar to S60712 band-6-pr 


2.01 


1.18 


429538 


BE182592 


Hs.1 1261 


small proline-rich protein 2A 


4.43 


2.90 


429903 


AL134197 


Hs.93597 


cyclin-dependent kinase 5, regulatory su 


11.80 


1.00 


430486 


BE062109 


Hs.241551 


chloride channel, calcium activated, fam 


12.28 


41.00 


430890 


X54232 


Hs.2699 


glypican 1 


1.58 


1.40 


431009 


BE149762 


Hs.48956 


gap junction protein, beta 6 (connexin 3 


60.25 


28.00 


431846 


BE019924 


Hs.271580 


uroplakin 1B 


4.49 


2.51 


433091 


Y12642 


Hs.3185 


lymphocyte antigen 6 complex, locus D 


1.20 


1.09 


434360 


AW015415 


Hs.127780 


ESTs 


40.98 


27.00 


434880 


U02388 


Hs.1 01 


cytochrome P450, subfamily IVF, polypept 


1.00 


1.00 


435505 


AF200492 


Hs.211238 


interleukin-1 homolog 1 


1.00 


38.00 


435793 


AB037734 


Hs.4993 


KIAA1313 protein 


23.68 


42.00 


436511 


AA721252 


Hs.291502 


ESTs 


16.76 


14.00 


438403 


AA806607 


Hs.292206 


ESTs 


1.00 


1.00 


439285 


AL133916 




hypothetical protein FLJ20093 


46.23 


139.00 


439606 


W79123 


Hs.58561 


G protein-coupled receptor 87 


33.61 


1.00 


439670 


AF088076 


Hs.59507 


ESTs, Weakly similar to AC004858 3 U1 sm 


1.00 


1.00 


439706 


AW872527 


Hs.59761 


ESTs, Weakly similar to DAP1_HUMAN DEATH 


86.55 


11.00 


440325 


NM_003812 


Hs.7164 


a disintegrin and metalloproteinase doma 


62.88 


147.00 


441525 


AW241867 


Hs.127728 


ESTs 


1.53 


1.42 


443162 


T49951 


Hs.9029 


DKFZP434G032 protein 


31.11 


38.00 


444378 


R41339 


Hs.12569 


ESTs 


1.00 


1.00 
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1.26 




MrUO IHul 


He 97QRR9 


Rh type C glycoprotein 


1.55 


AA7f\7ft 
44 f \Jf a 




He QQ14. 


ESTs 


47.24 


24.00 






ni). i voce. 


Homo sapiens. Similar to RIKEN cDNA 2010 


28.63 


1.00 




Af 004Z 


Hq IRQ 


alcohol dehydrogenase 7 (class IV), mu o 


1.00 


1.00 


449101 


AA205847 


Hs.23016 


G protein-coupled receptor 


2.58 


27.00 


450832 


AW970602 


Hs.105421 


ESTs 


25.17 


36.00 


452240 


AI591147 


Hs.61232 


ESTs 


13.42 


1.00 


453317 


NM_002277 


Hs.41696 


keratin, hair, acidic, 1 


1.19 


1.27 


453830 


AA534296 


Hs.20953 


ESTs 


24.92 


25.00 


454098 


W27953 


Hs.292911 


ESTs, Highly similar to S60712 band-6-pr 


1.26 


1.11 


455601 


AI368680 


Hs.816 


SRY (sex determining region Y)-box 2 


206.11 


1.00 
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TABLE 12B 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey 
439285 



CAT Number 
47065.1 



Accession 

AL133916 N79113 AF086101 N76721 AW950828 AA364013 AW955684 AI346341 AI867454 N54784 AI655270 AI421279 AW014882 
AA775552 N62351 N59253 AA626243 AI341407 BE175639 AA456968 AI358918 AA457077 



TABLE 12C 

Pkey: 
Ref: 

Strand: 
Nt_position: 



Unique number corresponding to an Eos probeset 

Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA 
sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495. 
Indicates DNA strand from which exons were predicted. 
Indicates nucleotide positions of predicted exons. 

Nt_position 

17982-18115,20297-20456 

28397-28617,28920-29045,29135-29296,29411-29567,29705-29787,30224-30573 
83215-83435,83531-83656,83740-83901,84237-84393,84955-85037,86290-86814 
165776-165996,166189-166314,166408-166569,167112-167268,167387-167469,168634-168942 
42904-43124,43211-43336,44607-44763,45199-45281,46337-46732 
121907-122035,122804-122921,124019-124161,124455-124610,125672-126076 
37999-38145,38652-38998,39727-39872,40557-40674,42351-42450 



Pkey 


Ref 


Strand 


400666 


8118496 


Plus 


401780 


7249190 


Minus 


401781 


7249190 


Minus 


401785 


7249190 


Minus 


401994 


4153858 


Minus 


402075 


8117407 


Plus 


404996 


6007890 


Plus 
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TABLE 13A: Genes Distinguishing Non-Malignant Lung Disease from Lung Tumors and Normal lung 
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Table 13A shows about 23 genes upregulated in non-malignant lung disease relative to lung tumors and normal lung. These genes were selected from about 59680 probesets on 
the Eos/Affymetrix Hu03 Genechip array. 

Table 13B show the accession numbers for those Pkey's lacking UnigeneID's for table 13A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Table 13C show the genomic positioning for those Pkey's lacking Unigene ID's and accession numbers in table 13A. For each predicted exon, we have listed the genomic 
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 



Pkey: 
ExAccn: 
UnigenelD: 
Unigene Title: 
R1: 

R2: 



Unique Eos probeset identifier number 

Exemplar Accession number, Genbank accession number 

Unigene number 

Unigene gene title 

Average of lung tumors (including squamous cell carcinomas, adenocarcinomas, small cell carcinomas, granulomatous and carcinoid tumors) divided by the 
average of normal lung samples 

Average of non-malignant lung disease samples (including bronchitis, emphysema, fibrosis, atelectasis, asthma) divided by the average of normal lung samples 



Pkey 


ExAccn 


UnigenelD 


Unigene Title 


R1 


R2 


408562 


AI436323 


Hs.31141 


Homo sapiens mRNA for KIAA1568 protein, 


1.00 


230.00 


409031 


AA376836 


Hs.76728 


ESTs 


1.00 


128.00 


412372 


R65998 


Hs.285243 


hypothetical protein FLJ22029 


1.00 


173.00 


415910 


U20350 


Hs.78913 


chemokine (C-X3-C) receptor 1 


1.00 


145.00 


417511 


AL049176 


Hs.82223 


chordin-like 


1.00 


179.00 


418819 


AA228776 


Hs.191721 


ESTs 


1.00 


140.00 


422060 


R20893 


Hs.325823 


ESTs, Moderately similar to ALU5_HUMAN A 


1.00 


156.00 


424585 


AA464840 


Hs.131987 


ESTs 


1.00 


167.00 


426753 


T89832 


Hs.170278 


ESTs 


1.00 


141.00 


429496 


AA453800 


Hs.192793 


ESTs 


1.00 


138.00 


430719 


AA488988 


Hs.293796 


ESTs 


1.00 


133.00 


431089 


BE041395 




ESTs, Weakly similar to unknown protein 


23.32 


941.00 


431385 


BE178536 


Hs.11090 


membrane-spanning 4-domains, subfamily A 


1.00 


157.00 


431728 


NM_007351 


Hs.268107 


multimerin 


1.00 


157.00 


436532 


AA721522 




gb:nv54h12.r1 NCI_CGAP_Ew1 Homo sapiens 


1.00 


218.00 


437960 


AI669586 


Hs.222194 


ESTs 


1.00 


147.00 


438202 


AW169287 


Hs.22588 


ESTs 


1.00 


141.00 


441499 


AW298235 


Hs.101689 


ESTs 


1.00 


167.00 


444513 


AL120214 


Hs.7117 


glutamate receptor, ionotropic, AMPA 1 


1.00 


151.00 


448253 


H25899 


Hs.201591 


ESTs 


1.00 


141.00 


453636 


R67837 


Hs.169872 


ESTs 


1.00 


116.00 


458332 


AI000341 


Hs.220491 


ESTs 


1.00 


192.00 


459587 


AA031956 




gb:zk15e04.s1 Soares_pregnant_uterus_NbH 


1.00 


154.00 



TABLE 13B 

Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 

Accession: Genbank accession numbers 

Pkey CAT Number Accession 

431089 327825_1 BE041395 AA491826 AA621946 AA715980 AA666102 

436532 421802_1 AA721522 AW975443 T93070 



TABLE 13C 



Pkey: Unique number corresponding to an Eos probeset 

Ref: Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA 

sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495. 

Strand: Indicates DNA strand from which exons were predicted. 

Nt_position: Indicates nucleotide positions of predicted exons. 

Pkey Ref Strand Nt_position 

402075 8117407 Plus 121907-122035,122804-122921,124019-124161,124455-124610,125672-126076 
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TABLE 14A: Preferred Utility and Subcellular Localization for Potential Lung Disease Targets 

Table 14A shows the subcellular localization and preferred utility for the genes appearing in Tables 9A and 10A. mAb symbolizes monoclonal antibody, diag symbolizes 
diagnostic, s.m. symbolizes small molecule, and CTL symbolizes cytotoxic lymphocytic ligand. These genes were selected from 59680 probesets on the Eos/Affymetrix Hu03 
Genechip array. 

Table 14B show the accession numbers for those Pkey's lacking UnigeneID's for table 14A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Table 14C show the genomic positioning for those Pkey's lacking Unigene ID's and accession numbers in table 14A. For each predicted exon, we have listed the genomic 
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 



Pkey: Unique Eos probeset identifier number 
ExAccn: Exemplar Accession number, Genbank accession number 
UnigeneID: Unigene number 
Unigene Title: Unigene gene title 
Pref. Utility: Preferred Utility 



Pred. Loc: 


Predicted subcellular localization 






Pkey 


ExAccn 


UnigeneID 


Unigene Title 


Pref Utility 


Pred. Loc 


400289 


X07820 


Hs.2258 


matrix metalloproteinase 10 (stromelysin 


mAb & diag & s.m. 


extracellular 




M242758 


Hs.79136 


UV-1 protein, estrogen regulated 


mAb 


plasma membrane 

I \^ w PI I fmA T 1 * W * p P wmmT 9 mmm P P ymf 


40907*5 






ENSP00000251056*:Plasma membrane calcium mAb & diag 


secreted 


40781 1 


AW190902 


Hs.40098 


cysteine knot superfamily 1, BMP antagon 


diag 


secreted 


408243 


Y00787 


Hs.624 


interleukin 8 


diag 


secreted 


40R7QO 


AW580227 


Hs.47860 


neurotrophic tyrosine kinase, receptor, 


mAb & s.m. 


plasma membrane 

mmf P \^ Sm* • T ■ k*4 III \m* 'PI ™" ■ 1 1 


408908 


BE296227 


Hs.250822 


serine/threonine kinase 15 


s.m. 


cytoplasm 


40Q041 


AB033025 


Hs.50081 


Hypothetical protein XP_051860 (KIAA119 


CTL & diag 


secreted 


409103 


AF251237 


Hs.112208 


XAGE-1 protein 


CTL 


nuclear 


409420 


Z15008 


Hs.54451 


laminin, gamma 2 (nicein (100kD), kalini 


diag 


secreted 


409832 


W74001 


Hs.55279 


serine (or cysteine) proteinase inhibito 


diag 


secreted 

mat wp 


4097*57 


NM_001898 


Hs.123114 


cystatin SN 


diag 


extracellular 


409893 


AW247090 


Hs.57101 


minichromosome maintenance deficient (S. 


CTL 


nuclear 




AW103364 


Hs.727 


inhibin, beta A (activin A, activin AB a 


diag 

\4 i«y 


extracellular 


410001 


AB041036 


Hs.57771 


kallikrein 11 

INCH H IM V> U 1 1 1 


diag 


extracellular 


41 0407 


X66839 


Hs.63287 


carbonic anhydrase IX 


mAb & s.m. 


plasma membrane 


41 041 R 


D31382 


Hs.63325 


transmembrane protease, serine 4 


mAb & diag & s.m. 


plasma membrane 

UIWWl 1 1 Vp<* 1 1 IWI 1 IVI *»* ' IV 


419140 


AA219691 


Hs.73625 
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mitochondrial 


419216 


AU076718 


Hs.164021 


small inducible cytokine subfamily B (Cy 


diag 


secreted 


419235 


AW470411 


Hs.288433 


neurotrimin 


mAb & diag 


plasma membrane 


419452 


U33635 


Hs.90572 


PTK7 protein tyrosine kinase 7 


mAb & s.m. 
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cartilage oltgomeric matrix protein (pse 


diag 
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heparin-binding growth factor binding pr 


diag 




423673 


BE003054 


Hs.1695 


matrix metalloproteinase 12 (macrophage 


mAb & diag & s.m. 
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s.m. 
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ns. I ooz^o 


sianniocaicin z 


mAh A Hian 
illAU Ot uidy 


cpprpfpH 


42b4<if 


Mobbby 
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CAU dUCIIUIal 


4zo/4o 


AWbyozOb 


Up C1Q70C 

HS.ytJ/85 


□idg 


428758 


A A/QQQQQ 

AA4oJyoo 


Up QQcno 
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|Jldol Mall »Ci l iui al ic 
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A A CC0~? 

445537 


A J 245b /I 


Up 4 OOil A 

HS. 12844 


tor-iiKe-domain, multiple d 


mAh A rllo/T 

mAD ot uisg 


cpprplpri 
OCOICLCU 


44bbiy 


Al \r\7RRA1 

AUO/bb4o 


Ue OIQ 

HS.313 


#%nn r n In rl nhnnnhnn rf\ fa m 1 ( C\C TO A nAriTin 

secreted pnospnoprotein i ^osieoponun, 


HI an 
Uldg 


cpprplpri 


44b921 


ABOIzl 1o 


Up 4 G CI Pi 

HS.lbbdO 


small mouciDie cytoKine suDiamny a \\sy 


uiag 


pylrappllnlar 

CAU dOCJIUIdl 


447033 


AI35/412 


Up 4) C7CA1 

HS.15/b01 


CCTe 

to IS 


PTi & Hi an 

\j 1 L & uldg 


cpptpIpH 

OCUICICU 


AA71A') 
44/04<£ 


AM QO.OGB 

Anyyzbo 


Ue -1QOOO 

HS.193^Z 


nomo sapiens, oimuar to kiivcin cuima zu iu 


CTI 

Vj 1 L 


nlacma mpmhranp 

UldOllld 1 1 ICI 1 IUI dl IC 


/HQ 0/1 "3 

44oZ4o 


Awoby/ /i 


Ue COCOA 


integnn, oeta o 


mAh ft c m _ 

IllAU Ot o.lll. 


^ AQQ A A 

448844 


AI5815iy 


Up ^ 77H GA 

HS.1 //1b4 


COTe 

tots 


mAh P. c m 
IIIAU Ot 5. III. 




AACi(\A0 

449048 


Z45051 


Up oonon 
HS.22y20 


similar to obo40i icattiej giucose inouc 


mAh 
mAD 


nlacma mpmhrane 

{Jldollld HlclllUIdllc 


449722 


bbzo00/4 


Up ooncn 
HS.239bO 


cyciin til 


e m 

s.m. 


pi/In nl a c m 
uyiUUIdolll 


450001 


MM f\f\4r\AA 

NM„00 1044 


Up ACiG 

HS.406 


nntiiln n n rw\ n r fn mi f 1 f £ /flAI IfAlKOnrmUlA 

solute carrier tamiiy b (neurotransmitte 


m Ah P p rn 

mAD ot s.m. 


nlacma mpmhranp 
pidolild UlclllUidHc 


450375 


a AnnQC>i7 
AA00954/ 




n nJ7r«in^nnrin n n *-J mnlnltnnt*ntni ri nr*A A?AmA 

a disintegnn and metaiioproteinase aoma 


mAh SL Hian )?> c m 
mAD Ot Uldg Ot o.lll. 


nlacma mpmhranp 
DldoHld HlclllUIdllc 


450701 


H3yyb0 


Up OOOjIC7 

HS.2884b7 


nypotneticai protein Ar_uyoioi leucine- 


mAh SL Wion 
mAD Ot Uldg 


nlacma mpmhranp 
pidolild HlclllUIdllc 


a ennoo 

450983 


A A Of\C3QA 

AA305J84 


Up 1C7i(n 

Hs. 25740 


tKUl (o. cerevisiaej-iiKe 


diag 


ScCIclCU 


HO 1 OuO 


74^Q4R 


Ue ^9fi444 


nartilanp acirlin nrntpin 1 


mAb & diao 


Dlasma membrane 

| M w i i 1 1^4 ill wi i ( wi 


452281 


T93500 


Hs.28792 


Homo sapiens cDNA FLJ11041 fis, clone PL 


diag 




452401 


NM_007115 


Hs.29352 


tumor necrosis factor, alpha-induced pro 


diag 


extracellular 


452747 


BE153855 


Hs.61460 


Ig superfamily receptor LNIR 


mAb 


plasma membrane 


452838 


U65011 
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preferentially expressed antigen in mela 


CTL 


nuclear 


453968 


AA847843 


Hs.62711 


High mobility group (nonhistone chromoso 


CTL & s.m. 


nuclear 


457489 


AI693815 


Hs.127179 


cryptic gene 


diag 


secreted 



TABLE 14B 



Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 

Pkey CAT Number Accession 



182 



WO 02/086443 

414883 15024 J 



450375 83327J 



PCT/US02/12476 

AA926960 M926959 W76521 W24270 W21526 AA037172 BE267636 H83186 AA469909 N86396 AA001348 BE535736 AA081745 BE566245 
AA082436 H72525 H77575 N49786 W80565 H78746 BE569085 W04339 R981 27 T55938 BE279271 AW960304 T29812 AA476873 BE297387 
AA292753 AA177048 NM_001826 X54941 BE314366 AA908783 A1719075 BE270172 BE269819 M889955 AI204630 W25243 AI935150 
AA872039 W72395 T99630 AI422691 H98460 N31428 BE255916 H03265 AI857576 M776920 AA910644 AA459522 AA293140 AW514667 
R75953 AW662396 AA662522 AI865147 A1423153 AW262230 AA584410 AA583187 AW024595 AW069734 AI828996 M282997 AA876046 
AW61 3002 AA527373 AW972459 AI831360 AA621 337 AA1 00926 AA77241 8 M594628 AI033892 W95096 AI034317 M398727 A1085031 
N95210 A1459432 A1041437 AA932124 AA627684 AA935829 AI004827 A1423513 AI094597 H42079 R54703 AI630359 AA617681 M978045 
AA643280 W44561 AI991988 AI537692 AI090262 AA740817 AI312104 AI91 1822 AA416871 A1185409 AA129784 AA701623 AI075239 
Al 139549 AA633648 AI339996 AI336880 M399239 AI078708 AI085351 AI362835 AI34661 8 Al 146955 AI989380 AI348243 N92892 M765850 
AI494230 AI278887 AA962596 AI492600 W80435 AA001979 R97424 Al 1 2901 5 N24127 AA1 57451 AA235549 AA459292 AA0371 14 AA129785 
A1494211 AW059601 AW886710 R92790 N59755 A136112B AW589407 H47725 H97534 H48076 H48450T99631 AW300758 H03431 R76789 
AA954344 H77576 R96823 AI457100 N92845 N49682 H42038 BE220698 BE220715 H99552 M701624 N74173 R54704 H79520 H72923 
H03266 BE261 919 AA769633 AA48031 0 AA507454 AA910586 AI203723 AW1 04725 W2561 1 W25071 T88980 H0351 3 T77589 R991 56 
W95095 R97470 AA702275 T77551 AA91 1 952 H82956 N83673 M283672 

AA009647 AA1 31254 AA374293 AW954405 H0441 0 AW606284 AA151166 BE1 57467 BE1 57601 H04384 W46291 AW663674 H04021 H01 532 
AA190993 H03231 H59605 H01642 AA852876 AA1 13758 AA626915 AA746952 AI161014 AA099554 R69067 



TABLE 14C 



Pkey: 
Ref: 

Strand: 
Nt_position: 

Pkey 

402075 



Unique number corresponding to an Eos probeset 

Sequence source. The 7 digit numbers in this column are Genbank identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA 
sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495. 
Indicates DNA strand from which exons were predicted. 
Indicates nucleotide positions of predicted exons. 



Ref Strand 
8117407 Plus 



Nt_position 

121907-122035,122804-122921,124019-124161,124455-124610,125672-126076 
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TABLE 15A: Information for all sequences in Table 16 

Table 15A shows the Seq ID No, Pkey, ExAccn, UnigenelD, and Unigene Title for all of the sequences in Table 16. 

Table 15B show the accession numbers for those Pkey's lacking UnigeneID's for table 15A. For each probeset we have listed the gene cluster number from which the 
oligonucleotides were designed. Gene clusters were compiled using sequences derived from Genbank ESTs and mRNAs. These sequences were clustered based on sequence 
similarity using Clustering and Alignment Tools (DoubleTwist, Oakland California). The Genbank accession numbers for sequences comprising each cluster are listed in the 
"Accession" column. 

Table 15C show the genomic positioning for those Pkey's lacking Unigene ID's and accession numbers in table 15A. For each predicted exon, we have listed the genomic 
sequence source used for prediction. Nucleotide locations of each predicted exon are also listed. 



Seq ID No: Sequence ID number 

Pkey: Unique Eos probeset identifier number 

ExAccn: Exemplar Accession number, Genbank accession number 

UnigeneID: Unigene number 

Unigene Title: Unigene gene title 



Seq ID No: 



Seq ID No: 1 & 2 
Seq ID No: 3 & 4 
Seq ID No: 5 & 6 
Seq ID No: 7 & 8 
Seq ID No: 9 & 10 
Seq ID No: 11 & 12 
Seq ID No: 13 & 14 
Seq ID No: 15 & 16 
Seq ID No: 17 & 18 
Seq ID No: 19 & 20 
Seq ID No: 21 & 22 
Seq ID No: 23 & 24 
Seq ID No: 25 & 26 
Seq ID No: 27 & 28 
Seq ID No: 29 & 30 
Seq ID No: 31 & 32 
Seq ID No: 33 & 34 
Seq ID No: 35 & 36 
Seq ID No: 37 & 38 
Seq ID No: 39 & 40 
Seq ID No: 41 & 42 
Seq ID No: 43 & 44 
Seq ID No: 45 & 46 
Seq ID No: 47 & 48 
Seq ID No: 49 
Seq ID No: 50 & 51 
Seq ID No: 52 & 53 
Seq ID No: 54 & 55 
Seq ID No: 56 & 57 
Seq ID No: 58 & 59 
Seq ID No: 60 & 61 
Seq ID No: 62 & 63 
Seq ID No: 64 & 65 
Seq ID No: 66 & 67 
Seq ID No: 68 & 69 
Seq ID No: 70 & 71 
Seq ID No: 72 & 73 
Seq ID No: 74 & 75 
Seq ID No: 76 & 77 
Seq ID No: 78 & 79 
Seq ID No: 80 & 81 
Seq ID No: 82 & 83 
Seq ID No: 84 & 85 
Seq ID No: 86 & 87 
Seq ID No: 88 & 89 
Seq ID No: 90 & 91 
Seq ID No: 92 & 93 
Seq ID No: 94 & 95 
Seq ID No: 96 & 97 
Seq ID No: 98 & 99 
Seq ID No: 100 & 101 
Seq ID No: 102 & 103 
Seq ID No: 104 & 105 
Seq ID No: 106 & 107 
Seq ID No: 108 & 109 
Seq ID No: 110 & 111 
Seq ID No: 112 & 113 
Seq ID No: 114 & 115 
Seq ID No: 116 
Seq ID No: 117 & 118 
Seq ID No: 119 & 120 
Seq ID No: 121 & 122 
Seq ID No: 123 & 124 
Seq ID No: 125 & 126 



Pkey 


ExAccn 


UnigeneID 


Unigene Title 


410407 


X66839 


Hs.63287 


carbonic anhydrase IX 


412719 


■lib t r~ A /> A 

AW016610 


Hs.816 


ESTs 


A A _ mm J — . A 

417034 


NM_006183 


Hs.80962 


neurotensin 


430486 


BE062109 


11 1 A A CCA 

Hs.241551 


chloride channel, calcium activated, fam 


407788 


BE514982 


Hs.38991 


S100 calcium-binding protein A2 


407788 


W—A A— A A f-L f\ *m, 

BE514982 


Hs.38991 


S100 calcium-binding protein A2 


A fm m A «h» 

407788 


i*m »~ k~* a innn 

BE514982 


Hs.38991 


S100 calcium-binding protein A2 


407788 


PX A A t*\ AA 

BE514982 


t t onr>A j 

Hs.38991 


S100 calcium-binding protein A2 


m *m. mm mm mm mm 

439285 


AL133916 




hypothetical protein FLJ20093 


413753 


U17760 


Hs.75517 


laminin, beta 3 (nicein (125kD), kalinin 


120486 


A 1 A | A A*m »*m a**, m-A wm 

AW368377 


Hs.137569 


tumor protein 63 kDa with strong homolog 


425650 1 


A t A A £\ /-\ i A J 1 

NM_001944 


Hs.1925 


desmoglein 3 (pemphigus vulgaris antigen 


412140 


AA219691 


Hs.73625 


RAB6 interacting, kinesin-like (rabkines 


423673 


BE003054 


Hs.1695 


_^>. aIJi. nn A(>^llAP\i'islAiirt AAiA 4 O /m^A Ortrt 

matrix metalloproteinase 12 (macrophage 


452838 


U65011 


Hs.30743 


preferentially expressed antigen in mela 


A A S\ S\ A A 

418663 


AK001100 


Hs.41690 


desmocollin 3 


418663 


AK001100 


Hs.41690 


desmocollin 3 


409632 


I A 1*1? A f\ (\ A 

W74001 


Hs.55279 


serine (or cysteine) proteinase inhibito 


429610 


a r\ a~a—\ j aat 

AB024937 


Hs. 21 1092 


LUNX protein; PLUNC (palate lung and nas 


406690 


M29540 


Hs. 220529 


carcinoembryonic antigen-related cell ad 


431846 


BE019924 


Hs. 271 580 


• k w* Am. mm t A*m\ t \ aaa A 1 1 

uroplakin 1B 


418830 


t~* ff* AWk A MM f* A 

BE513731 


Hs. 88959 


hypothetical protein MbL4oio 


424098 


AF077374 


Hs. 139322 


small proline-rich protein 3 


443648 


AI085377 


11 A A IP fl r\ 

Hs.143610 


ESTs 


311034 


BE567130 


Hs.311389 


ESTs, Highly similar to NKbu_nUMAN nmj*:- 


408522 


a i <~" m A t~\ A A 

AI541214 


Hs.46320 


Small proline-rich protein SPRK [human, 


a r-\ y— , J mm r*\ 

422158 


L10343 


Hs. 112341 


protease inhibitor 3, skin-derived (SKAL 


435505 


a ^— m* a\ m\ m a-\ f\ 

AF200492 


Hs.211238 


interleukin-1 homolog 1 


■ J\ M mm. AAA, AAA, 

417366 


BE185289 


Hs.1076 


small proline-rich protein 1B (cornifin) 


431958 


X63629 


Hs.2877 


cadherin 3, type 1, P-cadherin (placenta 


A\ A A r\. #*> /"% 

441020 


W79283 


i i nrn^A 

Hs.35962 


ESTs 


423217 


NM_000094 


11 i A JA 

Hs.1640 


collagen, type VII, alpha 1 (epidermolys 


429538 


BE182592 


Hs. 11261 


small proline-rich protein 2A 


448733 


NM_005629 


Hs. 187958 


solute carrier family 6 (neurotransmitte 


A J A a— A m—m A 

444371 


BE540274 


Hs.239 


forkhead box M1 


444371 


BE540274 


• i n nn 

Hs.239 


forkhead box M1 


444371 


BE540274 


Hs.239 


forkhead box M1 


A mm aJAa A S~\ in 

422168 


AA586894 


Hs.112408 


S100 calcium-binding protein A7 (psorias 


422168 


AA586894 


Hs.112408 


S100 calcium-binding protein A7 (psorias 


429259 


AA420450 


Hs.292911 


Plakophilin 


426440 


BE382756 


Hs.169902 


solute carrier family 2 (facilitated glu 


437044 


AL035864 


Hs.69517 


differentially expressed in Fanconi's an 


423662 


AK001035 


Hs.1 30881 


B-cell CLL/lymphoma 11A (zinc finger pro 


428484 


AF104032 


Hs.184601 


solute carrier family 7 (cationic amino 


429211 


AF052693 


Hs.198249 


gap junction protein, beta 5 (connexin 3 


417389 


BE260964 


Hs.82045 


midkine (neurite growth-promoting factor 


423634 


AW959908 


Hs.1690 


heparin-binding growth factor binding pr 


417515 


L24203 


Hs.82237 


ataxia-telangiectasia group D-associated 


441362 


BE614410 


Hs.23044 


RAD51 (S. cerevisiae) homolog (E coli Re 


425322 


U63630 


Hs.1 55637 


protein kinase, DNA-activated, catalytic 


449003 


X76342 


Hs.389 


alcohol dehydrogenase 7 (class IV), mu o 


431009 


BE149762 


Hs.48956 


gap junction protein, beta 6 (connexin 3 


409103 


AF251237 


Hs.1 12208 


XAGE-1 protein 


417542 


J04129 


Hs.82269 


progestagen-associated endometrial prote 


428471 


X57348 


Hs.1 84510 


stratifin 


418004 


U37519 


Hs.87539 


aldehyde dehydrogenase 3 family, member 


414761 


AU077228 


Hs.77256 


enhancer of zeste (Drosophila) homolog 2 


418203 


X54942 


Hs.83758 


CDC28 protein kinase 2 


447343 


AA256641 


Hs.236894 


ESTs, Highly similar to S02392 alpha-2-m 


437016 


AU076916 


Hs.5398 


guanine monphosphate synthetase 


449230 


BE613348 


Hs.211579 


melanoma cell adhesion molecule 


446989 


AK001898 


Hs.1 6740 


hypothetical protein FLJ11036 


457819 


AA057484 


Hs.35406 


ESTs, Highly similar to unnamed protein 


424687 


J05070 


Hs.151738 


matrix metalloproteinase 9 (gelatinase B 
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Seq ID No: 127 & 128 414430 

Seq ID No: 129 & 130 418462 

Seq ID No: 131 & 132 100668 

Seq ID No: 133 & 134 458933 

Seq ID No: 135 & 136 418478 

Seq ID No: 137 & 138 418478 

Seq ID No: 139 & 140 418478 

Seq ID No: 141 & 142 418478 

Seq ID No: 143 & 144 446269 

Seq ID No: 145 & 146 422765 

Seq ID No: 147 & 148 436481 

Seq ID No: 149 & 150 440325 

Seq ID No: 151 & 152 439606 

Seq ID No: 153 & 154 453884 

Seq ID No: 155 & 156 453884 

Seq ID No: 157 & 158 453884 

Seq ID No: 159 & 160 453884 

Seq ID No: 161 & 162 404877 

Seq ID No: 163 & 164 413129 

Seq ID No: 165 & 166 413281 

Seq ID No: 167 & 168 444781 

Seq ID No: 169 & 170 416819 

Seq ID No: 171 & 172 451320 

Seq ID No: 173 & 174 418543 

Seq ID No: 175 & 176 454034 

Seq ID No: 177 & 178 425397 

Seq ID No: 179 & 180 415817 

Seq ID No: 181 & 182 415817 

Seq ID No: 183 & 184 415817 

Seq ID No: 185 & 186 415817 

Seq ID No: 187 & 188 415817 

Seq ID No: 189 & 190 419121 

Seq ID No: 191 & 192 448993 

Seq ID No: 193 & 194 421817 

Seq ID No: 195 & 196 430393 

Seq ID No: 197 & 198 425057 

Seq ID No: 199 & 200 420462 

Seq ID No: 201 & 202 102963 

Seq ID No: 203 & 204 100576 

Seq ID No: 205 & 206 101175 

Seq ID No: 207 & 208 429038 

Seq ID No: 209 & 210 418678 

Seq ID No: 211 & 212 418678 

Seq ID No: 213 & 214 131927 

Seq ID No: 215 & 216 428182 

Seq ID No: 217 & 218 427335 

Seq ID No: 219 & 220 409420 

Seq ID No: 221 & 222 114346 

Seq ID No: 223 & 224 438956 

Seq ID No: 225 & 226 404440 

Seq ID No: 227 & 228 415669 

Seq ID No: 229 & 230 103312 

Seq ID No: 231 & 232 320843 

Seq ID No: 233 429065 

Seq ID No: 234 & 235 446102 

Seq ID No: 236 & 237 330495 

Seq ID No: 238 413573 

Seq ID No: 239 & 240 428479 

Seq ID No: 241 & 242 428479 

Seq ID No: 243 & 244 332180 

Seq ID No: 245 437915 

Seq ID No: 246 & 247 441553 

Seq ID No: 248 & 249 331692 

Seq ID No: 250 & 251 429413 

Seq ID No: 252 & 253 422283 

Seq ID No: 254 & 255 448357 

Seq ID No: 256 & 257 446292 

Seq ID No: 258 & 259 416209 

Seq ID No: 260 & 261 453922 

Seq ID No: 262 & 263 424046 

Seq ID No: 264 & 265 439223 

Seq ID No: 266 & 267 429228 

Seq ID No: 268 & 269 409757 

Seq ID No: 270 & 271 411089 

Seq ID No: 272 & 273 436511 

Seq ID No: 274 & 275 428969 

Seq ID No: 276 & 277 428969 

Seq ID No: 278 & 279 428969 

Seq ID No: 280 & 281 428969 

Seq ID No: 282 407137 

Seq ID No: 283 & 284 412723 

Seq ID No: 285 & 286 450701 

Seq ID No: 287 & 288 405770 

Seq ID No: 289 & 290 439453 

Seq ID No: 291 & 292 414774 



a m a /> nn A 

Al 346201 


nS./bllo 


BE001596 


Hs.8b2bb 


L05424 


i_i_ 4 cneHn 

Hs.lbablO 


AI638429 


LI- OVC7CQ 

Hs.24763 


U38945 


Hs.1174 


f ton t~\ A t~ 

U38945 


1 1— A AT A 

Hs.1174 


U38945 


1 ». A Al A 

Hs.1174 


U38945 


LI*. A 4 ~7 A 

Hs.1174 


AW263155 


11. A A rrn 

Hs. 14559 


AW409701 


Hs.1578 


AA379597 


Hs.5199 


NM_003812


Hs.7164 


W79123 


u. core* 
HS,5oobl 


AA355925 


HS. 6b lo I 


AA355925 




a a occnoc 

AA355925 




AA355925 


HS.ob^oZ 


AF292100 


Hs.1 04613 


A A O A fi^A 

AA861271 


Hs.222024 


ill i aj A Af\f\ 

NM_014400


LI- 4 4 nrft 

Hs.1 1950 


U77735 


Hs.80205 


AlA IA A rtATn 

AW1 18072 




NM_005329 


nS.obyb^ 


NM_000691


Hs.ofo 


1A A ADO 

J04088 


Li_ <ceo4c 

Hs.1obo4b 


U88967 


1_J_ 7O0C7 

Hs.78867


U88967 


LI- *7QQC7 

HsYobo/ 


U88967 


Hs.78867


U88967 


MS. /00b/ 


U88967 


U- 7QQC7 

nS./oob/ 


AA374372 


HS.oybzb 


AI471630 


HS.812/ 


A f A A r*r\-t A 

AF1 46074 


Hs.1 08660 


BE1 85030 


HS.241 305 


AA826434 


Hs.1619 


a rftpni a ~f 

AF050147 


Hs.97932 


\jr\r\ Af\ A 

X02404 


| i_ r\-j ACOA 

Hs. 274534 


X00356 


1 1_ 157AC0 
Hs.37058 


U82671 


Hs. 36980 


a 1 nnn r4i 

AL023513 


Hs. 194766 


NM_001327


Hs.1 67379 


NM_001327


Hs. 167379 


AJ003112 


Hs.34780 


BE386042 


Hs. 2933 17 


a a a a n r a 0 

AA448542 


Hs.251677 


Z15008 


II— CJl AC*. 

Hs.54451 


A 1 A A"JATA 

AL1 37256 


Hs.1 30489 


W00847 


11. ^ocrice 

Hs.1 35056 


NM_005025 


| 1. 70COrt 

Hs.78589 


\t A AA A 1 

Y 12642 


Hs.31 00 


nrA/>AAOO 

BE069288 


Hs.34744 


AI753247 


Hs.29643 


AW1 68067 


|_1„ ni Tefljl 

nS.317694 


U47924 


HS.71642 


A1733859 


HS.1490by 


Y00272 


it. ooxeco 
Hs.3345b2 


Y00272 


HS.od4bb<l 


AF134160 


L)_ "700*7 


Al 637993 


11. Of\1Q"IO 


AA281219 


Li- <io4nnc 

Hs.lzi/ab 


A ICOO A 0*7 

AI683487 


Ll„ 4 cOHO 


kit 1 f\4 Af\CO 

NM_014058


HS.201o^ 


AW41 1 307 


Hs.114311 


N201 69 


1 1_ jnonoo 

Hs.108923 


a rn 0 4 a m 

AF081497 


HS.^fbbo^ 


AA236776 


Li . -7nn*7D 

HS.790/8 


AF053306 


1 f_ ne7flQ 

Hs.36708 


A r*AA*7AAA 

AF027866 


Hs. 138202 


a l unnnnnn 

AW238299 


Hs. 250618 


Al 553633 


1 1 «. AAA j| i"7 

Hs. 326447 


1 U j AA^ AAA 

NM_001898 


Hs. 1231 14 


A A J r*p jr J 

AA456454 


Hs.214291 


AA721252 


1 I— AA<I CAA 

Hs.291502 


AF1 20274 


Hs.194689 


AF120274 


Hs.194689 


AF1 20274 


Hs.194689


AF1 20274 


Hs.194689 


T97307 




AA648459 


Hs.335951 


H39960 


Hs.288467 


BE264974 


Hs.6566 


X02419 


Hs.77274 



ubiquitin carboxyl-terminal esterase L1
integrin, beta 4 

CD44 antigen (homing function and Indian 

RAN binding protein 1 

cyclin-dependent kinase inhibitor 2A (me

cyclin-dependent kinase inhibitor 2A (me 

cyclin-dependent kinase inhibitor 2A (me 

cyclin-dependent kinase inhibitor 2A (me 

hypothetical protein FLJ10540 

baculoviral IAP repeat-containing 5 (sur

HSPG150 protein similar to ubiquitin-con 

a disintegrin and metalloproteinase doma

G protein-coupled receptor 87 

KIAA0186 gene product 

KIAA0186 gene product 

KIAA0186 gene product 

KIAA0186 gene product 

NM_005365:Homo sapiens melanoma antigen, 

RP42 homolog

transcription factor BMAL2 

GPI-anchored metastasis-associated prote

pim-2 oncogene 

diacylglycerol kinase, zeta (104kD) 
hyaluronan synthase 3 
aldehyde dehydrogenase 3 family, member 
topoisomerase (DNA) II alpha (170kD)
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
parathyroid hormone-like hormone 
KIAA0144 gene product 
ATP-binding cassette, sub-family C (CFTR 
estrogen-responsive B box protein 
achaete-scute complex (Drosophila) homol
chondromodulin I precursor 
calcitonin-related polypeptide, beta 
calcitonin/calcitonin-related polypeptid 
melanoma antigen, family A, 2 
seizure related gene 6 (mouse)-like 
cancer/testis antigen (NY-ESO-1) 
cancer/testis antigen (NY-ESO-1) 
doublecortex; lissencephaly, X-linked (d
ESTs, Weakly similar to GGC1_HUMAN G ANT
G antigen 7B 

laminin, gamma 2 (nicein (100kD), kalini
ATPase, aminophospholipid transporter-li 
Human DNA sequence from clone RP5-850E9 
NM_021048:Homo sapiens melanoma antigen, 
serine (or cysteine) proteinase inhibito 
lysosomal 

Homo sapiens mRNA; cDNA DKFZp547C136 (fr 
Homo sapiens cDNA FLJ13103 fis, clone NT 
ESTs 

guanine nucleotide binding protein (G pr 
ESTs 

cell division cycle 2, G1 to S and G2 to 
cell division cycle 2, G1 to S and G2 to 
claudin 1 

Homo sapiens clone N11 NTera2D1 teratoca 
ESTs 

wingless-type MMTV integration site fami 
DESC1 protein 

CDC45 (cell division cycle 45, S.cerevis 
RAB38, member RAS oncogene family 
Rh type C glycoprotein 
MAD2 (mitotic arrest deficient, yeast, h 
budding uninhibited by benzimidazoles 1 
serine (or cysteine) proteinase inhibito 
UL16 binding protein 2
ESTs 

cystatin SN 

cell division cycle 2-like 1 (PITSLRE pr 

ESTs 

artemin 

artemin 

artemin 

artemin 

gb:ye53h05.s1 Soares fetal liver spleen 
hypothetical protein AF301222
hypothetical protein XP_098151 (leucine-
NM_002362:Homo sapiens melanoma antigen, 
thyroid hormone receptor interactor 13 
plasminogen activator, urokinase 



185 



WO 02/086443 



Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 



Seq 
Seq 
Seq 
Seq 



ID No: 
ID No: 
ID No: 
ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
ID No: 
ID No: 
ID No: 
ID No: 
ID No: 
ID No: 
ID No: 
ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 
Seq ID No: 



Seq 
Seq 
Seq 
Seq 
Seq 
Seq 
Seq 
Seq 



293 & 294 
295 & 296 
297 & 298 
299 & 300 
301 & 302 
303 & 304 
305 & 306 
307 & 308 
309 

310 & 311 
312 & 313 
314 & 315 
316 & 317 
318 & 319 
320 & 321 
322 & 323 
324 & 325 
326 & 327 
328 & 329 
330 & 331 
332 & 333 
334 & 335 
336 & 337 
338 & 339 
340 & 341 
342 & 343 
344 & 345 
346 & 347 
348 & 349 
350 & 351 
352 & 353
354 & 355 
356 & 357 
358 & 359 
360 & 361 
362 & 363 
364 & 365 
366 & 367 
368 & 369 
370 & 371 
372 & 373 
374 & 375 
376 & 377 
378 & 379 
380 & 381 
382 & 383 
384 & 385 
386 & 387 
388 & 389 
390 & 391 
392 & 393 
394 & 395 
396 & 397 
398 & 399 
400 & 401 
402 & 403 
404 & 405 
406 & 407 
408 & 409 
410 & 411 
412 & 413 
414 & 415 
416 & 417 
418 & 419 
420 & 421 
422 & 423 
424 & 425 
426 & 427 
428 & 429 
430 & 431 
432 & 433 
434 & 435 
436 & 437 
438 & 439 
440 & 441 
442 & 443 
444 & 445 
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Hs.293815 


A a A on n 

134299 


A 1 At CO A A OA 

AW580939 


Hs.97199 


A A at 4 A 

41 2719 


A t A fA4 A A 4 A 

AW016610 


1 1 A D4 C 

HS.816 


A AA4 j~ f") 

422158 


1 4 A A 4 A 

L10343 


i i. i J no 4 4 
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1 |_ inn/In 
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419121 
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409459 


r\AA A AT 
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Hs.54481 
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330493 
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HS.82772 
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A lOVO'i AA 
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HS. 252587 
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HS.102 


A A 4 A A 4 

431221 


A A 4 4 AA4 C 
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A A 4 p^P 

431565 


Ar-4 i?4 Aif\ 
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A A 4 rAr 

431565 


A r* 4 C A A "7 A 

AF161470 


HS.2b0622 


a o AO r~ A 

132354 


nr-<n i-a a a 

BE1 85289 


Hs.1076 
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424441 


v/4 4 OCA 
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11—4 J*7An*7 
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103768 
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1 1—. AflAAAA 

Hs.296398 


A A -yr A f\ 

417512 


V/TA C O 4 

X76534 


HS.82226 


A A r* A A 

425266 


1 AA ATT 

J 00 077 


Hs.1 55421 


J A j rnn 

424503 


fc.ll A AAA AAC 

NM_002205 


Hs.149609 


A A A AO A 

400289 


X07820 


HS.2258 


A 4 OA AT 

418007 


A AA OCA A 

M13509 


HS. 83169 


A 4 A A A"T 

418007 


M13509 


HS.83169 


A 4 min 

418738 


A I AIOOOCOO 

AW388633 


HS,bbo2 


A 4 f*4 AO 

415138 


C18356 


HS.295944 


A 4 ArAP 

418506 


AA084248 


Hs.8ojo9 


423961 


D13666 


HS.1obd4o 


4 4 4 A 4 A 

414812 


V7ATCC 

X72755 


Hs.773b7 


A A T 4 O A 

417433 


r»r*ATAAAA 

BE270266 


• )_ Q04 OO 

Hs.82126 


A 4 ■» A O A 

417433 


io r* at A a a a 

BE270266 


i}— 04 00 

HS.82128 


A A AAAT 

422867 


1 O.A4 AT 

L32137 


Hs.1584 


J A A A AT 

428227 


A AAA4A4A 

M321649 


Hs.2248 


AAA A A 4 

444381 


nrAA*JAAP 

BE387335 


1 l_ A00740 

Hs.283713 


4 A AO AO 

400303 


A A A 4 AT CO 

AA242758 


l l_ "7A4 OC 

Hs.79136 


AAA T A A 

411789 


AF245505 


1 l_ "704 C7 

Hs.72157 


Jnnonn 

428698 


A A A C A"7TO 

AA852773 


1 1 _ A A iQA 0 

Hs.334838 


4 rAAAfl 

450098 


lAIATA A A 

W27249 


1 1 o4 no 

HS.81U9 


4 a 4 r* r* a 

421552 


A rAAAAAA 

AF026692 


Hs.1 05700 


A C AT A T 

452747 


BE1 53855 


Hs.o14b0 


450375 


A A A AAA 4 T 

AA009647 




A A A A 4 r 

426215 


At AIOCO J 4 A 

AW963419 


Hs.loWZJ 


JOPA A T 

425247 


klii AArn A A 

NM_005940


Hs. 1 00324 


A A A A A 4 

432201 


A 1 COQC4 O 

AI538613 


| l_ OAQOy|4 

HS.29oz41 


A ATfn f 

427585 


r\o 4 4 PA 

D31152 


HS.1/ 9/ 29 


A A A4 4 T 

442117 


A I A /A A 4 AA 4 

AW664964 


1 t_ 4 OQDOO 

Hs.l2ooyy 


4 A 4 A4 4 

431211 


■ JO AO 4 A 

M86849 




4 4 T AA A 

447033 


A1357412 


» i_ 4C7CA4 

Hs. iD/bUi 


4 A TA A A 

447033 


A 1 O f~T 4 4 A 

AI357412 


1 l_ 4 C*7Cri4 

HS.1o7bU1 


A 4TAAA 

447033 


A 1 O f"T 4 4A 

AI357412 


Hs.1o7b01 


115522 


nP*P»»( 4 A AT 

BE614387 


Hs.3dooyo 


4 4 A 4 4 A 

410418 


r*\ A 4 A A A 

D31382 


Hs.bdJ^o 


409041 


AB033025 


Hs.50081 


409041 


AB033025 


Hs.50081 


452461 


N78223 


Hs.108106 


412420 


AL035668 


Hs.73853 


416658 


U03272 


Hs.79432 


407811 


AW1 90902 


Hs.40098 



glutamate-cysteine ligase, catalytic sub 
ESTs, Weakly similar to T17330 hypotheti 
ESTs, Weakly similar to T17330 hypotheti 
ESTs, Weakly similar to T17330 hypotheti
ESTs, Weakly similar to T17330 hypotheti 
ESTs, Weakly similar to T17330 hypotheti 
High mobility group (nonhistone chromoso 
NM_022342:Homo sapiens kinesin protein 9
ESTs 

presenilins associated rhomboid-like pro
nitric oxide synthase 2A (inducible, hep 
ATPase, Class VI, type 11B
forkhead box E1 (thyroid transcription f 
ESTs, Weakly similar to 2109260A B cell 
peptidylglycine alpha-amidating monooxyg
hypothetical protein MGC5350 
ESTs 

unnamed protein product [Homo sapiens] 
minichromosome maintenance deficient (S. 
v-ets erythroblastosis virus E26 oncogen 
ESTs, Weakly similar to S41044 chromosom 
guanine nucleotide binding protein 11 
calcitonin receptor-like 
cadherin 5, type 2, VE-cadherin (vascula 
singed (Drosophila)-like (sea urchin fas 
Homo sapiens HSPC285 mRNA, partial cds 
complement component C1q receptor 
ESTs 

protease inhibitor 3, skin-derived (SKAL 
plakophilin 3 

RAN, member RAS oncogene family 
parathyroid hormone-like hormone 
low density lipoprotein receptor-related 
endogenous retroviral protease 
collagen, type XI, alpha 1
SRY (sex determining region Y)-box 4 
guanine monphosphate synthetase 
pituitary tumor-transforming 1 
insulin-like growth factor binding prote 
SRB7 (suppressor of RNA polymerase B, ye 
butyrate-induced transcript 1 
butyrate-induced transcript 1
small proline-rich protein 1B (cornifin)
H2A histone family, member X 
gb:Homo sapiens full length Insert cDNA 
glycoprotein (transmembrane) nmb 
alpha-fetoprotein 

integrin, alpha 5 (fibronectin receptor, 
matrix metalloproteinase 10 (stromelysin
matrix metalloproteinase 1 (interstitial
matrix metalloproteinase 1 (interstitial 
solute carrier family 7, (cationic amino 
tissue factor pathway inhibitor 2 
G protein-coupled receptor 39 
periostin (OSF-2os) 
monokine induced by gamma interferon 
5T4 oncofetal trophoblast glycoprotein
5T4 oncofetal trophoblast glycoprotein 
cartilage oligomeric matrix protein (pse 
small inducible cytokine subfamily B (Cy 
ESTs, Weakly similar to S64054 hypotheti 
LIV-1 protein, estrogen regulated 
Adlican 

KIAA1866 protein

hypothetical protein FLJ21080 

secreted frizzled-related protein 4 

Ig superfamily receptor LNIR

a disintegrin and metalloproteinase doma 

stanniocalcin 2 

matrix metalloproteinase 11 (stromelysin
Transmembrane protease, serine 3 
collagen, type X, alpha 1 (Schmid metaph 
ESTs; hypothetical protein for IMAGE:447 
gap junction protein, beta 2, 26kD (conn 
ESTs 
ESTs 
ESTs 

c-Myc target JP01 
transmembrane protease, serine 4 
Hypothetical protein, XP_051860 (KIAA119
Hypothetical protein, XP_051860 (KIAA119
transcription factor 
bone morphogenetic protein 2 
fibrillin 2 (congenital contractural ara
cysteine knot superfamily 1, BMP antagon 
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452401 
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Hs.406 


410407 
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AW341683 




412719 


AW016610 
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\ \ C\.A A A A, A, 

Hs.211092 
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M29540 


■ 4 A A A A A 

Hs.220529 


431846 
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Hs.271580 


422158 
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Hs.1 12341 
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t ft A A f* A *f 
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428484 
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431009 
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410555 
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410555 


■ 1 A A A A A 
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424687 
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■ 1 A f— A A A 
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410274 
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439606 
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NMJ>14400 


Hs.1 1950 
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ft Ik 4 A. A. f« A A A. 

NM_005329 


Hs.85962 
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Hs.78867 
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1 ■ AAA A*T 
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Hs.78867 
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U88967 


Hs.78867 


415817 


U88967 


Hs.78867 


415817 


1 r A A A A —t 

U88967 


Hs.78867 
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■ -m A A. A 

U88967 


Hs.78867 


421817 


AF1 46074 


II <4 A A A A A 

Hs. 108660 


418678 


NM_001327


ft 1 A A A A. 

Hs. 167379 


418678 


NM_001327


Hs. 167379 


409420 


Z15008 


Hs.54451 


332180 


AF134160 


Hs.7327 


408790 


AW580227 


1 1 a v« AAA 

Hs.47860 


408790 


AW580227 


Hs.47860 


439223 


AW238299 


Hs.250618 


409757 


NM_001898


1 1 ^ AAJ <t A 

Hs.123114 


428969 


AF1 20274 


Hs.194689 


428969 


a J A A A ^9 A 

AF1 20274 


Hs.194689 


428969 


AF1 20274 


li in jpnn 

Hs.194689 


428969 


A ^ J AAA n J 

AF1 20274 


ii a n jnnn 

Hs.194689 


450701 


* I A A. A 

H39960 


11 nnni n*7 

Hs.288467 


450701 


H39960 


Hs.288467 


414774 


x y Art J J A 

X02419 


1 1— "7*7 nv il 

Hs.77274 


407944 


R34008 


i l— n o mn - ? 

Hs.239727 


407944 


R34008 


Hs.239727 


457489 


AI693815 


Hs.1 27179 


429547 


AW009166 


Hs.99376 


407242 


M18728 




407242 


M18728 




407242 


M18728 




444006 


BE395085 


Hs.10086 



ESTs, Weakly similar to dJ36501 2.1 [H.sa 
ENSP00000251056*:Plasma membrane calcium 
cathepsin E 

cartilage acidic protein 1 
cartilage acidic protein 1 
cartilage acidic protein 1 
apolipoprotein L

death receptor 6, TNF superfamily member 
sema domain, immunoglobulin domain (Ig), 
serine/threonine kinase 12 
Predicted cation efflux pump 
C15000305:gi|3806122|gb|AAC69198.1| (AF0
C15000305:gi|3806122|gb|AAC69198.1| (AF0
similar to lysosome-associated membrane 
small inducible cytokine subfamily B (Cy 
interleukin 1 receptor antagonist
glypican 1 
aquaporin 4 
KIAA0877 protein 

chitinase 3-like 1 (cartilage glycoprote
lung type-I cell membrane-associated gly
tumor necrosis factor, alpha-induced pro 
tumor necrosis factor, alpha-induced pro 
solute carrier family 6 (neurotransmitte
carbonic anhydrase IX 

gb:hd13d01.x1 Soares_NFL_T_GBC_S1 Homo s
ESTs 

neurotensin 

chloride channel, calcium activated, fam 
laminin, beta 3 (nicein (125kD), kalinin 
desmoglein 3 (pemphigus vulgaris antigen 
matrix metalloproteinase 12 (macrophage 
desmocollin 3 
desmocollin 3

LUNX protein; PLUNC (palate lung and nas 
carcinoembryonic antigen-related cell ad 
uroplakin 1B 

protease inhibitor 3, skin-derived (SKAL 
cadherin 3, type 1, P-cadherin (placenta 
differentially expressed in Fanconi's an 
solute carrier family 7 (cationic amino 
gap junction protein, beta 5 (connexin 3 
midkine (neurite growth-promoting factor
gap junction protein, beta 6 (connexin 3 
progestagen-associated endometrial prote
melanoma cell adhesion molecule 
a disintegrin and metalloproteinase doma
a disintegrin and metalloproteinase doma 
matrix metalloproteinase 9 (gelatinase B 
integrin, beta 4 
hypoxia-inducible protein 2
G protein-coupled receptor 87 
NM_005365:Homo sapiens melanoma antigen,
GPI-anchored metastasis-associated prote 
hyaluronan synthase 3 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
protein tyrosine phosphatase, receptor-t 
ATP-binding cassette, sub-family C (CFTR 
cancer/testis antigen (NY-ESO-1) 
cancer/testis antigen (NY-ESO-1) 
laminin, gamma 2 (nicein (100kD), kalini 
claudin 1 

neurotrophic tyrosine kinase, receptor, 

neurotrophic tyrosine kinase, receptor, 

UL16 binding protein 2 

cystatin SN 

artemin 

artemin 

artemin 

artemin 

hypothetical protein XP_098151 (leucine- 
hypothetical protein XP_098151 (leucine- 
plasminogen activator, urokinase 
desmocollin 2 
desmocollin 2 
cryptic gene 
ESTs 

gb:Human nonspecific crossreacting antig 
gb:Human nonspecific crossreacting antig 
gb:Human nonspecific crossreacting antig 
type I transmembrane protein Fn14 
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TABLE 15B 



D No: 632 & 633 


429597 


NM_003816 


Hs.2442 


a disintegrin and metalloproteinase doma


D No: 634 & 635 


A n y— k A A A 

422109 


S73265 


| 1 i JHA 

Hs.1473 


gastrin-releasing peptide 


D No: 636 & 637 


419235 


AW47041 1 


l l Ann A no 

Hs.288433 


neurotrimin


ft 1 A A A A\ A A 

D No: 638 & 639 


t J a a J A 

449048 


Z45051 


Hs.22920 


> 'k., i n n A JAil iiIaV a1.iaa.aa !_ J. ^ a 

similar to S68401 (cattle) glucose induc


D No: 640 & 641 


419216 


AU076718 


Hs. 164021 


small inducible cytokine subfamily B (Cy 


D No: 642 & 643 


431462 


AW583672 


1 t A r» A A <J A 

Hs.256311 


granin-like neuroendocrine peptide precu


D No: 644 & 645 


448243 


AW369771 


1 1 r A AAA 

Hs.52620 


integrin, beta 8


D No: 646 & 647 


J A A j AT 

426427 


ft i n i*> n ri n 

M86699 


Hs. 169840 


TTK protein kinase 


D No: 648 & 649 


445537 


ft | /\ J — T J 

AJ245671 


Hs. 12844 


s~\ 111-—. * ~ — - — . - I 1 * - 1 „ /? 

EGF-like-domain, multiple 6 


D No: 650 & 651 


j a a a—* n 

422278 


AF072873 


Hs. 114218 


frizzled (Drosophila) homolog 6


D No: 652 & 653 


j a a J r A 

428450 


NM_014791 


Hs.184339 


KIAA0175 gene product 


D No: 654 & 655 


446619 


AU076643 


1 |_ A j| A 

Hs.313 


secreted phosphoprotein 1 (osteopontin, 


D No: 656 & 657 


j m (-i A 

453392 


U23752 


1 Ia ohaP a 

Hs. 32964 


SRY (sex determining region Y)-box 11


D No: 658 & 659 


j A A r~ J J 

426514 


BE616633 


Hs.170195 


bone morphogenetic protein 7 (osteogenic 


f \ L h A A /"\ A A 

D No: 660 & 661 


425776 


1 1 An J AO 

U25128 


11a a r*o Af\fm 

Hs. 159499 


parathyroid hormone receptor 2 


r— v ft i /-» a a. A n 

D No: 662 & 663 


425776 


U25128 


1 1- J f A J A A 

Hs. 159499 


parathyroid hormone receptor 2 


D No: 664 & 665 


431515 


NM_012152 


Hs.258583 


endothelial differentiation, lysophospha 


D No: 666 & 667 


a a A j j - A 

419452 


U33635 


1 1a AAf"T A 

Hs.90572 


PTK7 protein tyrosine kinase 7 


D No: 668 & 669 


A a a a r~ A 

432653 


ft 

N62096 


1 1a AAA iftp 

Hs.293185 


ESTs, Weakly similar to JC7328 amino aci


D No: 670 & 671 


A A A A 1— O 

432653 


N62096 


Hs.293185


ESTs, Weakly similar to JC7328 amino aci 


D No: 672 & 673 


A AS ^\ A f A 

432653 


N62096 


Hs.293185 


ESTs, Weakly similar to JC7328 amino aci 


D No: 674 & 675 


432653 


ft. I^AnnA 

N62096 


■ t _ a a A4 nr 

Hs.293185 


ESTs, Weakly similar to JC7328 amino aci 


• ft ft n A #*i 

D No: 676 & 677 


J J Aft « i 

410001 


» r-K AlJ AAA 

AB041036 


Hs.57771 


kallikrein 11


D No: 678 & 679 


426501 


AW043782 


Hs.293616 


ESTs 


D No: 680 & 681 


408369 


R38438 


Hs.1 82575 


solute carrier family 15 (H??? transport 


D No: 682 & 683 


445413 


AA151342 


Hs.12677 


CGI-147 protein 


D No: 684 & 685 


422424 


AI1 86431 


Hs.296638 


prostate differentiation factor 


D No: 686 & 687 


428330 


L22524 


Hs.2256 


matrix metalloproteinase 7 (matrilysin, 


D No: 688 & 689 


420610 


AI683183 


Hs.99348 


distal-less homeo box 5 



Pkey: Unique Eos probeset identifier number 
CAT number: Gene cluster number 
Accession: Genbank accession numbers 



Pkey 
309931 
330493 
439285 

450375 

451320 



CAT Number 
AW341683 
33264_5 
47065J 

83327J 

86576J 



Accession 

M27826 R78416 AA307645 AW957879 AW957800 M633529 H03662 

AL133916 N79113 AF086101 N76721 AW950828 AA3640 13 AW9556 84 Al 346341 AI867454 N54784 AI655270 A1421279 AW014882 
AA775552 N62351 N59253 M626243 AI341407 BE175639 M456968 AI358918 AA457077 

AA009647 AA131254 AA374293 AW954405 H04410 AW606284 AA151166 BE157467 BE157601 H04384 W46291 AW663674 H04021 H01532 
AA190993 H03231 H59605 H01642 M852876 M113758 AA626915 AA746952 A1161014 AA099554 R69067 
AW1 1 8072 AI631 982 T1 5734 AA2241 95 AI701458 W201 98 F26326 AA890570 N90552 AW071 907 AI671 352 AI375892 T0351 7 R88265 
AM 24088 AA224388 A1084316 AI354686 T33652 A1140719 A172021 1 T03490 AI372637 T15415 AW205836 AA630384 T03515 T33230 
AA017131 M443303 T33623 AI222556T33511 T33785AI419606 D55612 



TABLE 15C 



Pkey: Unique number corresponding to an Eos probeset 

Ref: Sequence source. The 7 digit numbers in this column are Genbank Identifier (GI) numbers. "Dunham I. et al." refers to the publication entitled "The DNA

sequence of human chromosome 22." Dunham I. et al., Nature (1999) 402:489-495.

Strand: Indicates DNA strand from which exons were predicted. 
Nt_position: Indicates nucleotide positions of predicted exons.

Pkey Ref Strand Nt_position

402075 8117407 Plus 121907-122035,122804-122921,124019-124161,124455-124610,125672-126076 

403329 8516120 Plus 96450-96598

403478 9958258 Plus 116458-116564 

404440 7528051 Plus 80430-81581 

404877 1519284 Plus 1095-2107 

405770 2735037 Plus 61057-62075 

405932 7767812 Minus 123525-123713 



188 



WO 02/086443 

Table 16 



PCT/US02/12476 



Seq ID NO: 1 DNA sequence 

Nucleic Acid Accession #: NM_001216 

Coding sequence: 43-1422



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



GCCCGTACAC 
AGCCCCTGGC 
CTGTCACTGC 
TCCCCCTTGG 
AGTGAAGAGG 
GAGGATCTAC 
TCCCTGAAGT 
AATAATGCCC 
CCGCCCTGGC 
CGCCCCCAGG 
CTCCCGCCGC 
CCTCCTGGGC 
CTGCACTGGG 
CCTGCCGAGA 
GGGCGCCCGG 
AGTGCCTATG 
CAGGTCCCAG 
TATGAGGGGT 
CAGACAGTGA 
GGTGACTCTC 
GAGGCCTCCT 
AATTCCTGCC 
ACCAGCGTCG 
GTGAGCTACC 
TGTGAGAAGG 
ATGCCACTTC 



11 

1 

ACCGTGTGCT 
TCCCTCTGTT 
TGCTTCTGAT 
GAGGAGGCTC 
ATTCACCCAG 
CTGGAGAGGA 
TAGAGGATCT 
ACAGGGACAA 
CCCGGGTGTC 
TCGCCGCCTT 
TCCCAGAACT 
TAGAGATGGC 
GGGCTGCAGG 
TCCACGTGGT 
GAGGCCTGGC 
AGCAGTTGCT 
GACTGGACAT 
CTCTGACTAC 
TGCTGAGTGC 
GGCTACAGCT 
TCCCTGCTGG 
TGGCTGCTGG 
CGTTCCTTGT 
GCCCAGCAGA 
CAGCCAGAGG 
CTTTTAACTG 



21 
I 

GGGACACCCC 
GATCCCGGCC 
GCCTGTCCAT 
TTCTGGGGAA 
AGAGGAGGAT 
GGATCTACCT 
ACCTACTGTT 
AGAAGGGGAT 
CCCAGCCTGC 
CTGCCCGGCC 
GCGCCTGCGC 
TCTGGGTCCC 
TCGTCCGGGC 
TCACCTCAGC 
CGTGTTGGCC 
GTCTCGCTTG 
ATCTGCACTC 
ACCGCCCTGT 
TAAGCAGCTC 
GAACTTCCGA 
AGTGGACAGC 
TGACATCCTA 
GCAGATGAGA 
GGTAGCCGAG 
CATCTGAGGG 
CCAAGAAATT 



31 
I 

ACAGTCAGCC 
CCTGCTCCAG 
CCCCAGAGGT 
GATGACCCAC 
CCACCCGGAG 
GAAGTTAAGC 
GAGGCTCCTG 
GACCAGAGTC 
GCGGGCCGCT 
CTGCGCCCCC 
AACAATGGCC 
GGGCGGGAGT 
TCGGAGCACA 
ACCGCCTTTG 
GCCTTTCTGG 
GAAGAAATCG 
CTGCCCTCTG 
GCCCAGGGTG 
CACACCCTCT 
GCGACGCAGC 
AGTCCTCGGG 
GCCGTGGTTT 
AGGCAGCACA 
ACTGGAGCCT 
GGAGCCGGTA 
TTTTAAAATA 



41 
I 

GCATGGCTCC 
GCCTCACTGT 
TGCCCCGGAT 
TGGGCGAGGA 
AGGAGGATCT 
CTAAATCAGA 
GAGATCCTCA 
ATTGGCGCTA 
TCCAGTCCCC 
TGGAACTCCT 
ACAGTGTGCA 
ACCGGGCTCT 
CTGTGGAAGG 
CCAGAGTTGA 
AGGAGGGCCC 
CTGAGGAAGG 
ACTTCAGCCG 
TCATCTGGAC 
CTGACACCCT 
CTTTGAATGG 
CTGCTGAGCC 
TTGGCCTCCT 
GAAGGGGAAC 
AGAGGCTGGA 
ACTGTCCTGT 
AATATTTATA 



51 
i 

CCTGTGCCCC 
GCAACTGCTG 
GCAGGAGGAT 
GGATCTGCCC 
ACCTGGAGAG 
AGAAGAGGGC 
AGAACCCCAG 
TGGAGGCGAC 
GGTGGATATC 
GGGCTTCCAG 
ACTGACCCTG 
GCAGCTGCAT 
CCACCGTTTC 
CGAGGCCTTG 
GGAAGAAAAC 
CTCAGAGACT 
CTACTTCCAA 
TGTGTTTAAC 
GTGGGGACCT 
GCGAGTGATT 
AGTCCAGCTG 
TTTTGCTGTC 
CAAAGGGGGT 
TCTTGGAGAA 
CCTGCTCATT 
AT 



Seq ID NO: 2 Protein sequence: 
Protein Accession #: NP_001207



11 



21 



I 

MAPLCPSPWL 
GEEDLPSEED 
DPQEPQNNAH 
ELLGFQLPPL 
VEGHRF PAE I 
EEGSETQVPG 
DTLWGPGDSR 
GLLFAVTSVA 



PLLIPAPAPG 
SPREEDPPGE 
RDKEGDDQSH 
PELRLRNNGH 
HWHLSTAFA 
LDISALLPSD 
LQLNFRATQP 
FLVQMRRQHR 



LTVQLLLSLL 
EDLPGEEDLP 
WRYGGDPPWP 
SVQLTLPPGL 
RVDEALGRPG 
FSRYFQYEGS 
LNGRVIEASF 
RGTKGGVSYR 



31 

1 

LLMPVHPQRL 
GEEDLPEVKP 
RVSPACAGRF 
EMALGPGREY 
GLAVLAAFLE 
LTTPPCAQGV 
PAGVDSSPRA 
PAEVAETGA 



41 



PRMQEDSPLG 
KSEEEGSLKL 
QSPVDIRPQL 
RALQLHLHWG 
EGPEENSAYE 
IWTVFNQTVM 
AEPVQLNSCL 



51 
I 

GGSSGEDDPL 
EDLPTVEAPG 
AAFCPALRPL 
AAGRPGSEHT 
QLLSRLEEIA 
LSAKQLHTLS 
AAGDILALVF 



Seq ID NO: 3 DNA sequence 

Nucleic Acid Accession #: BC013923 

Coding sequence: 438-1391



85 



AGCGGGGTTG 
GTGTTTGCAA 
AGAGGAGAGA 
TAATAATAAC 
TGATCCTGAT 
TCCTCGCGGA 
CCCGCGGGCC 
CCGCGCACAG 
AGCAAACTTC 
AAAACAGCCC 
AGCGGCGCAA 
TGGGCGCCGA 
AGCGGCTGCG 
AAACCAAGAC 
GCGGCAATAG 
AGCGCATGGA 
AGGACCAGCT 
AGCCCATGCA 
CCTACATGAA 
TGGCTCTTGG 
TTACCTCTTC 
GCATGTATCT 
CCCAGCACTA 
CACACATGTG 
GGAAATGGGA 
TCAAAAAAAA 
AACAC CAAT C 
GAGAGATCCT 
GGGGAGGGCG 
TTTAAAAGTT 
TAATATTTAG 
TTGTACAGTA 



11 
I 

TCTATTAACT 
AAG GGGG AAA 
GAAAGAAAGG 
AATCATCGGC 
TCCAGTTTGC 
GCCCTGCGCT 
CCCCAAAGTC 
CGCCCGCATG 
GGGGGGCGGC 
GGACCGCGTC 
GATGGCCCAG 
GTGGAAACTT 
AGCGCTGCAC 
GCTCATGAAG 
CATGGCGAGC 
CAGTTACGCG 
GGGCTACCCG 
CCGCTACGAC 
CGGCTCGCCC 
CTCCATGGGT 
CTCCCACTCC 
CCCCGGCGCC 
CCAGAGCGGC 
AGGGCCGGAC 
GGGGTGCAAA 
AAAAAAAAAA 
CCATCCACAC 
GGACTTCTTT 
GGGGAATGGA 
CTAGTGGTAC 
AGCTAGTCTC 
TTTATCGAGA 



21 



TGTTCAAAAA 

GTAGTTTGCT 

GAGAGAAGTT 

GGCGGCAGGA 

CTCTCTCTTT 

CCCGACACCC 

CCGGCCGGGC 

TACAACATGA 

GGCGGCAACT 

AAGCGGCCCA 

GAGAACCCCA 

TTGTCGGAGA 

ATGAAGGAGC 

AAGGATAAGT 

GGGGT CGGGG 

CACATGAACG 

CAGCACCCGG 

GTGAGCGCCC 

ACCTACAGCA 

TCGGTGGTCA 

AGGGCGCCCT 

GAGGTGCCGG 

CCGGTGCCCG 

AGCGAACTGG 

AGAGGAGAGT 

AAAATCCCAT 

TCACGCAAAA 

TKGGGGGACT 

CCTTGTATAG 

GGTAGGAGCT 

CAAGCGACGA 

TAAACATGGC 



31 

I 

GTATCAGGAG 
GCCTCTTTAA 
TGAGCCCCAG 
TCGGCCAGAG 
TTTTCCCCCA 
CCGCCCGCCT 
CGAGGGT CGG 
TGGAGACGGA 
CCACCGCGGC 
TGAATGCCTT 
AGATGCACAA 
CGGAGAAGCG 
ACCCGGATTA 
ACACGCTGCC 
TGGGCGCCGG 
GCTGGAGCAA 
GCCTCAATGC 
TGCAGTACAA 
TGTCCTACTC 
AGT CCGAGGC 
GCCAGGCCGG 
AACCCGCCGC 
GCACGGCCAT 
AGGGGGGAGA 
AAGAAACAGC 
CACCCACAGC 
ACCGCGATGC 
ATTTTTGTAC 
ATCTGGAGGA 
TTGCAGGAAG 
AAAAAATGTT 
AATCAAAATG 



41 

I 

TTGTCAAGGC 
GACTAGGACT 
GCTTAAGCCT 
GAGGAGGGAA 
AATTATTCTT 
CCCCTCCTCC 
CGGCCGCCGG 
GCTGAAGCCG 
GGCGGCCGGC 
CATGGTGTGG 
CTCGGAGATC 
GCCGTTCATC 
TAAATACCGG 
CGGCGGGCTG 
CCTGGGCGCG 
CGGCAGCTAC 
GCACGGCGCA 
CTCCATGACC 
GCAGCAGGGC 
CAGCTCCAGC 
GGACCTCCGG 
GCCCAGCAGA 
TAACGGCACA 
AATTTTCAAA 
ATGGAGAAAA 
AAATGACAGC 
CGACAAGAAA 
AGAGAAAACC 
AAGAAAGCTA 
TTTGCAAAAG 
TTAATATTTG 
TCCATTGTTT 



51 
I 

AGAGAAGAGA 
GAGAGAAAGA 
TTCCAAAAAA 
GCGCTTTTTT 
CGCCTGATTT 
TCTCCCCCCG 
CGGGCCGGGC 
CCGGGCCCGC 
GGCAACCAGA 
TCCCGCGGGC 
AGCAAGCGCC 
GACGAGGCTA 
CCCCGGCGGA 
CTGGCCCCCG 
GGCGTGAACC 
AGCATGATGC 
GCGCAGATGC 
AGCTCGCAGA 
ACCCCTGGCA 
CCCCCTGTGG 
GACATGATCA 
CTTCACATGT 
CTGCCCCTCT 
GAAAAACGAG 
CCCGGTACGC 
TGCAAAAGAG 
ACTTTTATGA 
TGGGGAGGGT 
CGAAAAACTT 
TCTTTACCAA 
CAAGCAACTT 
ATAAGCTGAG 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 



60 
120 
180 
240 
300 
360 
420 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 



189 



10 



15 



WO 02/086443 

AATTTGCCAA TATTTTTCAA 
TTAGGACAGT TGCAAACGTG 
TAAAAATTGT ACAAAAGGAA 
GTTTAAAAAG GGCAAAAGTT 
AAATGG C CAT GCAGGTTGAC 
TTCCATTTTG TTCAGATAAA 
GTTTGTAATA TTTCTGTAAA 
GTAGTTGTAT TTTAAAAGAT 
GTATATATTT GAACTAATAT 
CCATTATGCA CAGTTTGAGA 
AAAAAAACAA AACAAAAAAA 
CACAACACAA AAACAAAAAA 
CCACAACACA AACAACAACA 



PCT/US02/12476 



GGAGAGGCTT 
AAAAGAAGAA 
AAAATTAGAA 
TTAGACTGTA 
ACCGTTGGTA 
AAAAACCATG 
TTTATTGTGA 
TCGGCTCTGT 
CATCCTTATA 
TAAATAAATT 
CAAAAAACAA 
AAAAAAAAGA 
CACAGAGGG 



CTTGCTGAAT 
AATTATTCAA 
TAAGTACTGG 
CTAAATTTTA 
ATTTATAATA 
AAATTACTGT 
TATTTTAAGG 
ATTATTTGAA 
ACAGGTACAT 
TTTGAAATAT 
AAACAGAAAA 
AACAAACACA 



TTTGATTCTG 
ATTTGGACAT 
CGAACCATCT 
TAACTTACTG 
GCTTTTGTTC 
GTTTGAAATA 
TTTTCCCCCC 
TCAGTCTGCC 
TTTCAACTTA 
GGACACTGAA 
AACAAAAAAA 
CAACACAACA 



CAGCTGAAAT 1980 

TTTAATTGTT 2040 

CTGTGGTCTT 2100 

TTAAAAGCAA 2160 

GATCCCAACT 2220 

TTTTCTTATG 22 80 

TTTATTTTCC 2 340 

GAGAATCCAT 2400 

AGTTTTTACT 24 60 

AAAAAAAAAA 2520 

AAAACAAAAC 2580 

C AAC ACAAAA 2 640 



Seq ID NO: 4 Protein sequence: 
Protein Accession #:CAA83435.1 



20 



25 



MYNMMETELK 
QENPKMHNSE 
KKDKYTLPGG 
PQHPGLNAHG 
GSWKSEASS 
GPVPGTAING 



11 

i 

PPGPQQTSGG 
ISKRLGAEWK 
IiLAPGGNSMA 
AAQMQPMHRY 
SPPWTSSSH 
TLPLSHM 



21 
) 

GGGNS TAAAA 
LLSETEKRPF 
SGVGVGAGLG 
DVSALQYNSM 
SRAPCQAGDL 



GGNQKNSPDR 
IDEAKRLRAL 
AGVNQRMDSY 
TSSQTYMNGS 
RDMISMYLPG 



41 
i 

VKRPMNAFMV 
HMKEHPDYKY 
AHMNGWSNGS 
PTYSMSYSQQ 
AEVPEPAAPS 



51 
I 

WSRGQRRKMA 60 

RPRRKTKTLM 120 

YSMMQDQLGY 180 

GTPGMALGSM 240 

RLHMSQHYQS 300 



30 



35 



40 



Seq ID NO: 5 DNA sequence 
Nucleic Acid Accession #: U91618 
Coding sequence: 29-541



11 



45 



, CGGACTTGGC 
CATGCTACTC 
AGCATTAGAA 
TCCCTCTTGG 
AGCTGAGGAA 
TGCTTTAGAT 
TCACAGCAGG 
TGACAAAAAT 
GCTGTATGAG 
AGAGAATAAA 
ATTATATTTG 
ATTGAATGTG 
TCTTCAAAAA 



TTGTTAGAAG 
CTGGCTTTCA 
GCAGATTTCT 
AAGATGACTC 
ACAGGAGAAG 
GGCTTTAGCT 
GCTTTTCAAC 
GGAAAGGAAG 
AATAAACCCA 
TCATTTATTT 
TGTGAAAATG 
TTTTTCTGCA 
AAAAAAAAAA 



21 

I 

GCTGAAAGAT 
GCTCCTGGAG 
TGACCAATAT 
TGCTAAATGT 
TTCATGAAGA 
TGGAAGCAAT 
ACTGGGAGTT 
AAGT CAT AAA 
GAAGACCCTA 
ACATGTGATT 
TGACAAACAC 
CTAATAGAAA 
AAATGGGGCC 



31 

[ 

GATGGCAGGA 
TCTGTGCTCA 
GCATACATCA 
TTGCAGTCTT 
GGAGCTTGTT 
GTTGACAATA 
AATCCAGGAA 
GAGAAAAATT 
CAT ACT CAAA 
GTGATTCATC 
ACTTATCTGT 
TTAGACTAAG 
GCAATT 



41 
I 

ATGAAAATCC 
GATT CAGAAG 
AAGATTAGTA 
GTAAATAATT 
GCAAGAAGGA 
TACCAGCTCC 
GATATTCTTG 
CCTTATATTC 
AGAGATTCTT 
ATCCCTTAAT 
CTCTTCTACA 
TGTTTTCAAA 



51 

i 

AGCTTGTATG 60 

AGGAAATGAA 120 

AAGCACATGT 180 

TGAACAGCCC 240 

AACTTCCTAC 3 00 

ACAAAATCTG 3 60 

ATACTGGAAA 420 

TGAAACGGCA 480 

ACTATTACTG 540 

TAAATATCAA 600 

ATTGTGGTTT 660 

TAAATCTAAA 720 



Seq ID NO: 6 Protein sequence: 
50 Protein Accession #: AAB50564 

1 11 21 31 41 51 

I l l l l l 

MMAGMKIQLV CMLLLAFSSW SLCSDSEEEM KALEADFLTN MHTSKISKAH VPSWKMTLLN 

55 VCSLVNNLNS PAEETGEVHE EELVARRKLP TALDGFSLEA MLTIYQLHKI CHSRAFQHWE 

LIQEDILDTG NDKNGKEE V I KRKIPYILKR QLYENKPRRP YILKRDSYYY 



60 
120 



60 



Seq ID NO: 7 DNA sequence 

Nucleic Acid Accession #: NM_006536.2

Coding sequence: 109-2940



65 



70 



75 



80 



85 



ACCTAAAACC 
ATGTATGCAG 
AGCATTGCAG 
GAACTCCCAT 
ATTGCAATTA 
ATAACTGAAG 
ATAAAGATTT 
TCATATGAAA 
TACACCCTAC 
TTCCTACTGA 
GAATGGGCCC 
ATAAATGGGC 
GTGTGTGAAA 
GGATGCACCT 
AGTTTATCTT 
CTACAGAACC 
TTTCACCACA 
GTACAGGCTG 
GCTGACAGAC 
ATTCATACCT 
CACCAAATTA 
TCAGCTAAAA 
AAACTGAATG 
CTTCTTGGCA 



11 
I 

TTGCAAGTTC 
CAGGCTCAGT 
GTCCTATTTG 
TCCTGGGAGC 
ATCCTCAGGT 
CTTCATTTTA 
TAATACCTGC 
AGGCAAATGT 
AATACAGAGG 
ATGATAACTT 
ACCTCCGTTG 
AAAATCAAAT 
AAGGTCCTTG 
TTATCTACAA 
CTGTGGTTGA 
AGATGTGCAG 
GCTTTCCCAT 
GTGACAAAGT 
TCCTTCAACT 
TCGTGGGCAT 
ACAGCAATGA 
CAGACATCAG 
GAAAAGCTTA 
ATTGCTTACC 



21 
! 

AGGAAGAAAC 
GTGAGTGAAC 
CAACCTGAAG 
TGGAGTACAG 
ACCTGAGAAT 
CCTATTTAAT 
CACATGGAAA 
CATAGTGACT 
GTGTGGAAAA 
AACAGCTGGC 
GGGTGTGTTC 
TAAAGTGACA 
CCCCCAAGAA 
TAGCACCCAA 
ATTTTGTAAT 
CCTCAGAAGT 
GAATGGGACT 
GGTCTGTTTA 
ACAACAAGCC 
TGCCAGTTTC 
TGATCGAAAG 
CATTTGTTCA 
TGGCTCTGTG 
CACTGTGCTC 



31 

I 

CATCTGCATC 
TGGAGGCTTC 
TTTGTGACTC 
CTTCAAGACA 
CAGAACCTCA 
GCTACCAAGA 
GCTAATAATA 
GACTGGTATG 
GAGGGAAAAT 
TACGGATCAC 
GATGAGTATA 
AGGTGTTCAT 
AACTGTATTA 
AATGCAACTG 
GCAAGTACCC 
GCATGGGATG 
GAGCTTCCAC 
GTGCTGGATG 
GCAGAATTTT 
GACAGCAAAG 
TTGCTGGTTT 
GGGCTTAAGA 
ATGATATTAG 
AGCAGTGGTT 



41 

I 

CATATTGAAA 
TCTACAACAT 
TCCTGGTTGC 
ATGGGTATAA 
TCTCAAACAT 
GAAGAGTATT 
ACAGCAAAAT 
GGG CACATGG 
ACATTCATTT 
GAGGCCGAGT 
ACAATGACAA 
CTGACATCAC 
TTAGTAAGCT 
CATCAATAAT 
ACAACCAAGA 
TAATCACAGA 
CTCCTCCCAC 
TGTCCAGCAA 
ATTTGATGCA 
GAGAGATCAG 
CATATCTGCC 
AAGGATTTGA 
TGACCAGCGG 
CAACAATTCA 



51 
I 

ACCTGACACA 60 

GACCCAAAGG 120 

CTTAAGTTCA 180 

TGGATTGCTC 240 

TAAGGAAATG 300 

TTTCAGAAAT 360 

AAAACAAGAA 420 

AGATGATCCA 480 

CACACCTAAT 540 

GTTTGTCCAT 600 

ACCTTTCTAC 660 

AGGCATTTTT 720 

TTTTAAAGAA 780 

GTTCATGCAA 840 

AGCACCAAAC 900 

CTCTGCTGAC 960 

ATTCTCGCTT 1020 

GATGGCAGAG 1080 

GATTGTTGAA 1140 

AGCCCAGCTA 1200 

CACCACTGTA 1260 

GGTGGTTGAA 1320 

AGATGATAAG 1380 

CTCCATTGCC 1440 



190 



10 



15 



20 



25 



30 



35 



WO 02/086443 

CTGGGTTCAT CTGCAGCCCC 
TTCTTTGTTC CAGATATATC 
TCTGGAACTG GAGACATTTT 
AAACCTCACC AT CAATTGAA 
ATGTTTCTAG TTACGTGGCA 
GGACGAAAAT ACTACACAAA 
TGGATTCCAG GAACAGCTAA 
TCTCTGCAAG CCCTGAAAGT 
GCCACTGTGG AAGCCTTTGT 
TATGCCAATG TGAAACAGGG 
GAGCCAGAGA CTGGAGATCC 
GTTATAAAAA ATGATGGAAT 
TATAGCTTGA AAGTGCATGT 
CCAGGGAGTC ATGCTATGTA 
GCTCCAAGGA AATCAGTAGG 
AGCTCAGGAG GCTCCTTTTC 
CCACCATGCA AAATTATTGA 
TGGACAGCAC CTGGAGAAGA 
AGT AAAAGT C TACAGAATAT 
AAGCGAAATC CTCAGCAAGC 
ACGAATGGAC CTGAACATCA 
GCAATACGAG CAATGGATAG 
CCTCTGTTTA TTCCCCCCAA 
GGAQTTTTAA CAGCAATGGG 
CATACTTTAA GCAGGAAAAA 
ATAAATATCC AAAGTGT CTT 
CATACTAACA AAGTCAAATT 
ATACAGATAA GATTTTTACA 
CCTTACACTT TGGCTATGAA 
GCAAAGGGAA GGGTAAAGTC 
AATAGCCCCA AGCAGAGAAA 
TCATTTAGTT ACTTTGATTA 
TTTACATGAA GATCATGCTA 
CTTGCTATTT TGTTATATAT 
TTTCACTGTA AGAGGTAACC 
TTTATGACAA AGGTCTATTG 
TTTCTAAGTT TATTGCCTTG 
TACCTAGGAA A 
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AAAT CTGGAG 
AAACTCCAAT 
CCAGCAACAT 
AAACACAGTG 
GGCCAGTGGT 
TAATTTTATC 
GCCTGGGCAC 
GACAGTGACC 
GGAAAGAGAC 
ATTTTATCCC 
TGTTACGCTG 
TTACTCGAGG 
CAATCACTCT 
TGTACCAGGT 
CAGAAATGAG 
AGTGCTGGGA 
CCTGGAAGCT 
CTTTGATCAG 
CCAAGATGAC 
TGGCATCAGG 
GCCAAATGGA 
GAACTCCTTA 
TTCTGATCCT 
TTTGATAGGA 
GAGAGCAGAC 
CCTTCTTAGA 
AACATCAAAA 
TGGTAGATCA 
CAAATAATAA 
GGACCAGTGT 
AGGAGGGTAG 
ATTTTTCTTT 
TATTTTATAT 
ATTTCAGATG 
TTTAACAATA 
AATTTATTTG 
GGTTATTATG 



GAATTAT CAC 
AGCATGATTG 
ATTCAGCTTG 
ACTGTGGATA 
CCTCCTGAGA 
ACCAATCTAA 
TGGACTTACA 
TCTCGCGCCT 
AGCCTCCATT 
AT T CTTAATG 
AGACTCCTTG 
TATTTTTTCT 
CCCAGCATAA 
TACACAGCAA 
GAGGAGCGAA 
GTTCCAGCTG 
G T AAAAGT AG 
GGCCAGGCTA 
TTTAACAATG 
GAGATATTTA 
GAAACACATG 
CAGTCTGCTG 
GTACCTGCCA 
ATCATTTGCC 
AAGAAAGAGA 
TATAAGACCC 
CTGTATTAAA 
ACAATTCTTT 
AAATTATTCT 
CAAGGAAAGT 
GTCTGCATTA 
TCTCCTTATC 
ATGTAGCCCC 
ACATCTCCCT 
TGGGTATTAC 
TNTGTAAGTT 
GAATGATAGT 



GTCTTACAGG 
ATGCTTTCAG 
AAAGTACAGG 
ATACTGTGGG 
TTATATTATT 
CTTTTCGGAC 
CCCTGAACAA 
CCAACTCAGC 
TTCCTCATCC 
CCACTGTCAC 
ATGATGGAGC 
CCTTTGCTGC 
GCACCCCAAC 
ACGGTAATAT 
AGTGGGGCTT 
GCCCCCACCC 
AAGAGGAATT 
CAAGCTATGA 
CTATTTTAGT 
CGTTCTCACC 
AAAGCCACAG 
TAT CTAACAT 
GAG ATTAT CT 
TTATTATAGT 
ATGGAACAAA 
ATGGCCTTCG 
ATGCATTGAG 
TTGGGGGTAG 
TTAAAGTAAT 
TTGTTTTATT 
TAACTGTCTG 
TGTGCAGTAC 
TAATGCAAAG 
GCTAATGCTC 
CTTTGTCTCT 
TCTACTCCCA 
TATAGCCCCN 



AGGTTTAAAG 1500 

TAGAATTTCC 1560 

TGAAAATGTC 1620 

CAACGACACT 1680 

TGAT CCTGAT 1740 

AGCTAGTCTT 1800 

TACCCATCAT 1860 

TGTGCCCCCA 1920 

TGTGATGATT 1980 

TGCCACAGTT 2040 

AGGTGCTGAT 2100 

AAATGGTAGA 2160 

CCACTCTATT 2220 

TCAGATGAAT 22 80 

TAGCCGAGTC 2340 

TGATGTGTTT 2400 

GACCCTATCT 24 60 

AATAAG AATG 2520 

AAATACATCA 2580 

CCAGATTTCC 2 640 

AATTTATGTT 2 700 

TGCCCAGGCG 2760 

TATATTGAAA 2820 

TGTGACACAT 2880 

ATTATTATAA 2 940 

ACTACAAAAA 3 00 0 

TTTTTGTACA 3 0 60 

ATTAGAAAAC 3120 

GTCTTTAAAG 3180 

GAGGTGGAAA 3240 

TGTGAAGCAA 3300 

AGGTTGCTTG 3360 

CTCTTTACCT 3420 

AGAGATCTTT 3480 

TCATACCGGT 3 540 

TCAAAGCAGC 3600 

TATAATGCCT 3660 



40 



Seq ID NO: 8 Protein sequence:
Protein Accession #: NP_006527.1



11 



45 



50 



55 



60 



MTQRSIAGPI 
IKEMITEASF 
GDDPYTLQYR 
KPFYINGQNQ 
MFMQSLSSW 
TFSLVQAGDK 
RAQLHQINSN 
GDDKLLGNCL 
SRISSGTGDI 
FDPDGRKYYT 
AVPPATVEAF 
AGADV I KNDG 
IQMNAPRKSV 
LTLSWTAPGE 
PQISTNGPEH 
LILKGVLTAM 



CNLKFVTLLV 
YLFNATKRRV 
GCGKEGKYIH 
IKVTRCSSDI 
EFCNASTHNQ 
WCLVLDVSS 
DDRKLLVSYL 
PTVLSSGSTI 
FQQHIQLEST 
NNFITNLTFR 
VERDSLHFPH 
IYSRYFFSFA 
GRNEEERKWG 
DFDQGQATSY 
QPNGETHESH 
GLIGIICLII 



21 

I 

AIiSSELPFLG 
FFRNIKILIP 
FTPNFLLNDN 
TGI FVCEKGP 
EAPNLQNQMC 
KMAEADRLLQ 
PTTVSAKTDI 
HSIALGSSAA 
GENVKPHHQL 
TASIiWIPGTA 
PVMIYANVKQ 
ANGRYSLKVH 
FSRVSSGGSF 
EIRMSKSLQN 
RIYVAIRAMD 
WTHHTLSRK 



31 

AGVQLQDNGY 
ATWKANNNSK 
LTAGYGSRGR 
CPQENCIISK 
SLRSAWDVIT 
LQQAAEFYLM 
SICSGLKKGF 
PNIiEELSRLT 
KNTVTVDNTV 
KPGHWTYTLN 
GFYPILNATV 
VNHSPSISTP 
SVLGVPAGPH 
IQDDFNNAIL 
RNSLQSAVSN 
KRADKKENGT 



41 
I 

NGLLIAINPQ 
IKQESYEKAN 
VFVHEWAHLR 
LFKEGCTFIY 
DSADFHHSFP 
QIVEIHTFVG 
EWEKLNGKA 
GGLKFFVPDI 
GNDTMFLVTW 
NTHHSLQALK 
TATVEPETGD 
AHS I PGSHAM 
PDVFPPCKII 
VNTSKRNPQQ 
IAQAPLFIPP 
KLL 



51 
I 

VPENQNLISN 60 

VIVTDWYGAH 120 

WGVFDEYNND 180 

NSTQNATASI 240 

MNGTELPPPP 300 

IASFDSKGEI 360 

YGSVMILVTS 42 0 

SNSNSMIDAF 480 

QASGPPEIIL 540 

VTVTSRASNS 600 

PVTLRLLDDG 660 

YVPGYTANGN 720 

DLEAVKVEEE 780 

AGIREIFTFS 840 

NSDPVPARDY 900 



Seq ID NO: 9 DNA sequence 
Nucleic Acid Accession #: Eos sequence 
65 Coding sequence: 336-632 

1 11 21 31 41 51 

l I l l l I 

CTCCCCTCAC CCCGGTCCAG GATGCCCAGT CCCCACGACA CCTCCCACTT CCCACTGTGG 60 

70 CCTGGGTGGG CTCAGGGGCT GCCCTTGACC TGGCCTAGAG CCCTCCCCCA GCTGGTGGTG 120 

GAGCTGGCAC TCTCTGGGAG GGAGGGGGCT GGGAGGGAAT GAGTGGGAAT GGCAAGAGGC 180 

CAGGGTTTGG TGGGATCAGG TTGAGGCAGG TTTGGTTTCC TTAAAATGCC AAGTTGGGGG 240 

CCAGTGGGGC CCACATATAA ATCCTCACCC TGGGAGCCTG GCTGCCTTGC TCTCCTTCCT 300 

GGGTCTGTCT CTGCCACCTG GTCTGCCACA GATCCATGAT GTGCAGTTCT CTGGAGCAGG 360 

75 CGCTGGCTGT GCTGGTCACT ACCTTCCACA AGTACTCCTG CCAAGAGGGC GACAAGTTCA 420 

AGCTGAGTAA GGGGGAAATG AAGGAACTTC TGCACAAGGA GCTGCCCAGC TTTGTGGGGG 480 

AGAAAGTGGA TGAGGAGGGG CTGAAGAAGC TGATGGGCAG CCTGGATGAG AACAGTGACC 540 

AG CAGGTGG A CTTCCAGGAG TATGCTGTTT TCCTGGCACT CATCACTGTC ATGTGCAATG 600 

ACTTCTTCCA GGGCTGCCCA GACCGACCCT GAAGCAGAAC TCTTGACTTC CTGCCATGGA 660 

80 TCTCTTGGGC CCAGGACTGT TGATGCCTTT GAGTTTTGTA TTCAATAAAC TTTTTTTGTC 720 

TGTTGATAAT ATTTTAATTG CTCAGTGATG TTCCATAACC CGGCTGGCTC AGCTGGAGTG 780 

CTGGGAGATG AGGGCCTCCT GGATCCTGCT CCCTTCTGGG CTCTGACTCT CCTGGAAATC 840 

TCTCCAAGGC CAGAGCTATG CTTTAGGTCT CAATTTTGGA ATTTCAAACA CCAGCAAAAA 900 

ATTGGAAATC GAGATAGGTT GCTGACTTTT ATTTTGTCAA ATAAAGATAT TAAAAAAGGC 960 

85 AAAT AC CA 

Seq ID NO: 10 Protein sequence: 



191 



WO 02/086443 

Protein Accession #: NP_005969.1

1 11 21 31 41 51 

I I i I l l 

MMCSSLEQAL AVLVTTFHKY SCQEGDKFKL SKGEMKELLH KELPSFVGEK VDEEGLKKLM 
GSLDENSDQQ VDFQEYAVFL ALITVMCNDF FQGCPDRP 



Seq ID NO: 11 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 336-626

1 11 21 31 41 51 

1 I I I I I 

CTCCCCTCAC CCCGGTCCAG GATGCCCAGT CCCCACGACA CCTCCCACTT CCCACTGTGG 

CCTGGGTGGG CTCAGGGGCT GCCCTTGACC TGGCCTAGAG CCCTCCCCCA GCTGGTGGTG 

GAGCTGGCAC TCTCTGGGAG GGAGGGGGCT GGGAGGGAAT GAGTGGGAAT GGGAAGAGGC 

CAGGGTTTGG TGGGATCAGG TTGAGGCAGG TTTGGTTTCC TTAAAATGCC AAGTTGGGGG 

CCAGTGGGGC CCACATATAA ATCCTCACCC TGGGAGCCTG GCTGCCTTGC TCTCCTTCCT 

GGGTCTGTCT CTGCCACCTG GTCTGCCACA GATCCATGAT GTGCAGTTCT CTGGAGCAGG 

CGCTGGCTGT GCTGGTCACT ACCTTCCACA AGTACTCCTG CCAAGAGGGC GACAAGTTCA 

AGCTGAGTAA GGGGGAAATG AAGGAACTTC TGCACAAGGA GCTGCCCAGC TTTGTGGGGC 

ATTCCAGAGA ACCATGTGGT GTGAGGGCCT TCCGAGTCCA TCTGTTTAAT CCTGT CATTG 

GAGACTTGAG AAACCAGAGC CCAGAAGGGA AAAGTGATTG TCCCAAGATC ACACAGCACT 

GGAGAAAGTG GATGAGGAGG GGCTGAAGAA GCTGATGGGC AGCCTGGATG AGAACAGTGA 

CCAGCAGGTG GACTTCCAGG AGTATGCTGT TTTCCTGGCA CTCATCACTG TCATGTGCAA 

TGACTTCTTC CAGGGCTGCC CAGACCGACC CTGAAGCAGA ACTCTTGACT TCCTGCCATG 

GATCTCTTGG GCCCAGGACT GTTGATGCCT TTGAGTTTTG TATTCAATAA ACTTTTTTTG 

TCTGTTGATA ATATTTTAAT TGCTCAGTGA TGTTCCATAA CCCGGCTGGC TCAGCTGGAG 

TGCTGGGAGA TGAGGGCCTC CTGGATCCTG CTCCCTTCTG GGCTCTGACT CTCCTGGAAA 

TCTCTCCAAG GCCAGAGCTA TGCTTTAGGT CTCAATTTTG GAATTTCAAA CACCAGCAAA 

AAATTGGAAA TCGAGATAGG TTGCTGACTT TTATTTTGTC AAATAAAGAT ATTAAAAAAG 

GCAAATACCA 

Seq ID NO: 12 Protein sequence: 
Protein Accession #: Eos sequence

1 11 21 31 41 51 

l l I I l l 

MMCSSLEQAL AVLVTTFHKY SCQEGDKFKL SKGEMKELLH KELPSFVGHS REPCAVRAFR 
VHLFNPVIGD LRNQSPEGKS DCPKITQHWR KWMRRG 



Seq ID NO: 13 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 58-354 

1 11 21 31 41 51 

l I I I l l 

GTGAGCTCAC CATGTGGGGG TGAGGCTGAG AGAAAACAAG TACACAGCCA CAGATCCATG 
ATGTGCAGTT CTCTGGAGCA GGCGCTGGCT GTGCTGGTCA CTACCTTCCA CAAGTACTCC 
TGCCAAGAGG GCGACAAGTT CAAGCTGAGT AAGGGGGAAA TGAAGGAACT TCTGCACAAG 
GAGCTGCCCA GCTTTGTGGG GGAGAAAGTG GATGAGGAGG GGCTGAAGAA GCTGATGGGC 
AGCCTGGATG AGAACAGTGA CCAGCAGGTG GACTTCCAGG AGTATGCTGT TTTCCTGGCA 
CTCATCACTG TCATGTGCAA TGACTTCTTC CAGGGCTGCC CAGACCGACC CTGAAGCAGA 
ACTCTTGACT TCCTGCCATG GATCTCTTGG GCCCAGGACT GTTGATGCCT TTGAGTTTTG 
TATTCAATAA ACTTTTTTTG TCTGTTGATA ATATTTTAAT TGCTCAGTGA TGTTCCATAA 
CCCGGCTGGC TCAGCTGGAG TGCTGGGAGA TGAGGGCCTC CTGGATCCTG CTCCCTTCTG 
GGCTCTGACT CTCCTGGAAA TCTCTCCAAG GCCAGAGCTA TGCTTTAGGT CTCAATTTTG 
GAATTTCAAA CACCAGCAAA AAATTGGAAA TCGAGATAGG TTGCTGACTT TTATTTTGTC 
AAATAAAGAT ATTAAAAAAG GCAAATACCA 

Seq ID NO: 14 Protein sequence: 
Protein Accession #: NP_005969.1 

1 11 21 31 41 51

l l l I 1 I 

MMCSSLEQAL AVLVTTFHKY SCQEGDKFKL SKGEMKELLH KELPSFVGEK VDEEGLKKLM 
GSLDENSDQQ VDFQEYAVFL ALITVMCNDF FQGCPDRP 



Seq ID NO: 15 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 62-358

1 11 21 31 41 51 

I I l l l l 

GGAGGGTGTG CCGCTGAGTC ACTGCCTGGG CATCTGGGCC TGGAACCTCG GCCACAGATC 
CATGATGTGC AGTTCTCTGG AGCAGGCGCT GGCTGTGCTG GTCACTACCT T CCACAAGT A 
CTCCTGCCAA GAGGGCGACA AGTTCAAGCT GAGTAAGGGG GAAATGAAGG AACTTCTGCA 
CAAGGAGCTG CCCAGCTTTG TGGGGGAGAA AGTGGATGAG GAGGGGCTGA AGAAGCTGAT 
GGGCAGCCTG GATGAGAACA GTGACCAGCA GGTGGACTTC CAGGAGTATG CTGTTTTCCT 
GGCACTCATC ACTGTCATGT GCAATGACTT CTTCCAGGGC TGCCCAGACC GACCCTGAAG 
CAGAACTCTT GACTTCCTGC CATGGATCTC TTGGGCCCAG GACTGTTGAT GCCTTTGAGT 
TTTGTATTCA ATAAACTTTT TTTGTCTGTT GATAATATTT TAATTGCTCA GTGATGTTCC 
ATAACCCGGC TGGCTCAGCT GGAGTGCTGG GAGATGAGGG CCTCCTGGAT CCTGCTCCCT 
TCTGGGCTCT GACTCTCCTG GAAATCTCTC CAAGGCCAGA GCTATGCTTT AGGTCTCAAT 
TTTGGAATTT CAAACACCAG CAAAAAATTG GAAATCGAGA TAGGTTGCTG ACTTTTATTT 



192 



10 



WO 02/086443 

TGTCAAATAA AGATATTAAA AAAGGCAAAT ACCA 

Seq ID NO: 16 Protein sequence: 
Protein Accession #: NP_005969.1

1 11 21 31 41 51 

1 1 1 I I I 

MMCSSLEQAL AVLVTTFHKY SCQEGDKFKL SKGEMKELLH KELPSFVGEK VDEEGLKKLM 

GSLDENSDQQ VDFQEYAVFL AL I T VMCNDF FQGCPDRP 



60 
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15 



Seq ID NO: 17 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 939-2372



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



85 



i 
I 

AAGACGGATT 
AGAATAGTTA 
CCCGAGGCTC 
CGCGGGCGCA 
AACCAAGCAC 
CTGTGGTGTG 
AATTTTCTGG 
GCAGAGGCGG 
CGCTCGCGCT 
GGCGGGCGTG 
AACAAGGAAT 
GGGCCATGCA 
GGTTCGCTAT 
ACCAGCTCAG 
GAGAGCCGCA 
GCGGGGACAG 
ATGGACCCGC 
CCGCTTTCGC 
CTTCTCCTGG 
TCAGCGAAAT 
AAGCTTATGT 
ATAAAGCATT 
CGAGTTTGTC 
ATCCATTTAC 
GTCCAGACAC 
ACCTGCAGAT 
TGGAGGAAGG 
TGTAT TGGGA 
GCTCCTTAAG 
CGGAAAATCT 
CTAT CACATT 
AAGGCAACCC 
AATACATCTG 
TGGATAATCG 
GGAAGGATGA 
CAAACCCAAA 
GGGACACCAC 
GGGAACATCT 
TGGTAATGCT 
TTTTGTTTCA 
GGCTGTGGTG 
CTTATCCCGG 
GCTGTACTAT 
GTAACTCTCA 
TTACAGTAGT 
AAAGTGTGCT 
TTGACCTGCA 
GTCTAATCTA 
TTCAGAGGGT 
ACCATCACTT 
GTCCAAATGT 
TTAGCCAGCA 
AAGAAAAAAA 
GGCATAGTCA 
TTGCCCTTTT 
AGGCCACAGT 
CCTGGGAGCA 
CCCCCTACAA 
CCAGCAGCAA 
TGCTGAGAGG 
ACACCTGTTT 
CAGGCAGTAT 
TGTTCCTTTT 
AATCAGCTCT 
TTTTAAAAAT 
T CTAT AG ATT 
CAAGGCATTA 
TCCATAATGA 
ATGAAGACCT 



11 
I 

CTCAGACAAG 
CGGTTTGTCA 
TGCCCGCGCC 
GGGCACGCGT 
GGTTTCCATT 
AATTAGGGAC 
AGTTTCTGCC 
CGGCGGCGGC 
CTACGCGCTC 
AGGCGCCGGA 
CTGCGCCCCA 
GCGACGGCCG 
GCCGGGGCCA 
CCTCTGATAA 
AGCGCAGGGA 
GCACTCGGGC 
CATGGCGCGG 
CTGTCCCACG 
CATCGTGGCA 
TTTCATCGCA 
GGGACTGAGA 
TCTGAAAAAC 
TAGGAAACAT 
ATGCTCCTGT 
TCAGGATTTG 
ACCCAATTGT 
AAAGTCTATC 
TGTTGGTAAC 
GATAACTAAC 
TGTAGGAGAA 
TCTCGAATCT 
CAAACCAGCG 
TACTAAAATA 
CACT CACATG 
GAAACAGATT 
TTATCCTGAT 
GAACAGAAGT 
CTCGGTCTAT 
GTTTCTGCTT 
TAAGATCCCA 
CTTGTTGGTT 
GAAGTGCTGC 
ATGAAGCCTG 
GGCAGCTAAG 
TCAAATACAA 
TTTTGACCCT 
AAGTTAAAAA 
CATGTAACAC 
TTGACTTTTT 
TGGGACTTGG 
TTAGCTTAGG 
AAACAAAACA 
A CAAG AACAA 
ATTTCAGAAT 
TTATTTGCCC 
ATCTCATGCT 
GAATGGCTGG 
CATACTGTCA 
AG AGGTGG C A 
GCAGCCTTAG 
CATTCACTTT 
GCTTGTCCTG 
TTATCAGGAG 
GACAGTTAGA 
TTATTTTTTT 
TTTAACTAGT 
AT CT TAATAA 
ATATTTTATA 
TT CACAGAAT 



21 
I 

GCTTGCAAAT 
CCCGACCCTC 
TGGCTTCTTC 
TCGCGCACAC 
TCAAAAAGGG 
CGGGAGGCGT 
CCTGCTCTGC 
TCCCGGAATT 
AGTCCCCGGC 
GCCCGGCCTC 
GAGAGTCCCG 
CCGCGGAGCT 
CTGTGAACCC 
GCTGGACTCG 
AGGCCTCCCC 
TGGCACTGGC 
CTCTGGGGCT 
TCCTGCAAAT 
TTTCCGAGAT 
AACCAGAAAA 
AATCTGACAA 
AGCAACCTGC 
TTCCGTCACC 
GACATTATGT 
TACTGCCTGA 
GGTTTGCCAT 
ACATTATCCT 
CTGGTTTCCA 
ATTTCATCCG 
GATCAAGATT 
CCAACCTCAG 
CTTCAGTGGT 
CATGTTACCA 
AACAATGGGG 
TCTGCTCACT 
GTAATTTATG 
AATGAAATCC 
GCTGTGGTGG 
AAGTTGGCAA 
CTGGATGGGT 
GATGCTGCCA 
TTATCTGGGG 
CATATACTGT 
CAGCACCTCA 
AACTGAAATG 
ACTGGACATT 
AAAATTAAAG 
ATATTTTAGT 
CATCTATAAC 
TAGTATTATT 
TCTGAGAGTC 
AAACAAAACA 
GCAGCAACAG 
AACTAAGAGT 
TCTGCGATCC 
GTTTGCATTA 
CCTGCTGTGA 
TACTGCTGGG 
GGTCGCTAAT 
AGCTGTGGAT 
AGCATCACAG 
AAGAGAGGTT 
GACTTCAGAG 
CATGCACACA 
TGGAAATAGT 
CCAACACAGT 
ACCAGGATCC 
CTGCATCCTT 
CCTATGGATT 



31 

I 

GCCCCGCAGC 
CCGGATCGCC 
GTAGCTGGAT 
CCTAGCACAC 
AGACAGCCTC 
CGAACGGAGG 
GTCAGCCCTC 
GGGTTGGAGC 
GGTAGCAGGA 
GAGGTGCATA 
GGAGCGCCGC 
CCGAGCAGCG 
TGCCGCCTGC 
GCACGCCCGC 
GCACGGGTGG 
TGCTAGGGAT 
TCTGCTGGCT 
GCAGTGCCTC 
TGGAGCCTAA 
GGTTAGAAAT 
TTGTGGATTC 
AGCACATCAA 
TTGACTTGTC 
GGATCAAGAC 
ATGAAAGCAG 
CTGCAAATCT 
GTAGTGTGGC 
AACATATGAA 
ATGACAGTGG 
CTGTCAACCT 
ACCACCACTG 
TCTATAACGG 
ATCACACGGA 
ACTACACTCT 
TCATGGGCTG 
AAGATTATGG 
CTTCCACAGA 
TGATTGCGTC 
GACACTCCAA 
AGCTGAAATA 
TGTAAGCTGG 
TTTTCTGGTA 
GAGCTGTGAT 
AGAAAACATG 
AAATCCCATT 
TATTGACTTA 
TTGAGAACAG 
GTGATTTTCT 
ACAGTGACTA 
AAAAGGT TAT 
AAACAATGTT 
AACAAATGAA 
CTGTTTTGTT 
GGAATATATG 
ACCTGCTTTT 
CAGAACTGCA 
GCAGGAGAGG 
TTTTCATGGG 
GAATATATGC 
TTCTGCATCC 
TGACCTTTGT 
TGGCTATCCC 
CCAGGCCTGC 
GACGCCATAG 
TGCACAAATG 
CAGAAACATT 
ATTTAGGTAC 
TACATTAGCC 
GCAGCATTTC 



41 



CATCATT TAA 
TAATTTGTCC 
GCATATCGTG 
ATGAACACGC 
TACCGCGATT 
AACGGTTCAT 
ACGTCACTTC 
AGGAGCCTCG 
GCCTGGACCC 
CCGGACCCCC 
CGGTCGGTGC 
GTAGCGCCCC 
CGGAACACTC 
AACAAGCACC 
GGGAAAGCGG 
GTCGTCCTGG 
GGTTGTGGGC 
TCGGAT CTGG 
CAGTGTAGAT 
CATCAACGAA 
TGGATTAAAA 
TTTTACCCGA 
TGAACTGATC 
TCTCCAAGAG 
CAAGAATATT 
GGCCGCACCT 
AGGTGATCCG 
TGAAACAAGC 
GAAGCAGATC 
CACTGTGCAT 
GTGCATTCCA 
GGCAATATTG 
GTACCACGGC 
AATAGCCAAG 
GCCTGGAATT 
AACTGCAGCG 
CGTCACTGAT 
TGTGGTGGGA 
GTTTGGCATG 
AAGGAAAAGA 
ACTCCTGGGA 
GATGTGGGCG 
TGGGGAACAC 
TTAAATTAAT 
GGATTGTACT 
ATTGCTTCTG 
GTATAAGTGC 
ATACTCTAAT 
AAAGAGTTAA 
TTCCTTCACT 
AAGGATTGTC 
AAACGTTTAA 
GGGGCTATAG 
CATATGGTGA 
TAGAAGTCTG 
GCTTTTCTAC 
AGATTCTAAG 
TAGGAAAGCT 
TTTATAATGT 
CCCCTGAGTC 
ATGCTCTGTT 
CACCCCACCC 
AGCATTTTGT 
CTGGATTGGA 
CTGCAATTTA 
GTTTTGAATC 
CACTTGATAT 
ACTAAATACG 
ACTTGGCTAC 



51 
I 

CTGCACCCGC 60 

CTAGTGAGAC 120 

CTCCGGGCAG 180 

GCAAGAGCTG 240 

GTAGAAGAGA 300 

CTTAGAGACT 360 

GCCAGCAGTA 420 

CTGGCTGCTT 480 

AGGCGCCGCC 540 

ATTCGCATCT 600 

CCGGCGCGCC 660 

CCTGTAAAGC 720 

TTCGCTCCGG 780 

GAGGAGTTAA 840 

CCGGTGCAGC 900 

ATAAGGTGGC 960 

TTCTGGAGGG 1020 

TGCAGCGACC 1080 

CCTGAGAACA 1140 

GATGATGTTG 1200 

TTTGTGGCTC 1260 

AACAAACTGA 132 0 

CTGGTGGGCA 1380 

GCTAAATCCA 1440 

CCCCTGGCAA 1500 

AACCTCACTG 1560 

GTTCCTAATA 162 0 

CACACACAGG 1680 

TCTTGTGTGG 1740 

TTTGCACCAA 1800 

TTCACTGTGA 1860 

AATGAGTCCA 1920 

TGCCTCCAGC 1980 

AATGAGTATG 2040 

GACGATGGTG 2100 

AATGACATCG 2160 

AAAACCGGTC 222 0 

TTTTGCCTTT 22 80 

AAAGGTTTTG 2340 

CAGAGAAAGG 2400 

CTGCTGTTGG 2460 

GTGTTTGGAG 252 0 

CAATGCAGAG 2580 

GCTTCTCTTC 2640 

TCTCTTCTGA 2700 

TTTATTAAAA 2760 

ACACTGAATA 2820 

CAGCACTGAA 2880 

GGGTATATAT 2940 

GTCAATAAAA 30 00 

TTAAAGTTCC 3060 

AAAGAAGAAG 3120 

ATTTAAGTTA 3180 

AATTATAACC 3240 

CCGAGTGAGA 3300 

TCTGAAAAGG 3360 

AAGGATAGTC 3420 

TGTCCTGACC 3480 

CCTTCTTCAT 3540 

TGACCCATGG 3600 

CAGTCTGTGT 3 660 

CACCCCACCC 3720 

TTGAAAACAC 3780 

AACATTGATG 3 840 

GCTTTAAGGT 390 0 

CTCTGTAAAC 3 960 

AAAAAGGAT A 4020 

TTATTGCTTG 4080 

TTCATACCCA 4140 



193 



WO 02/086443 PCT/US02/12476 

TGCCTTAAAG AGGGGCAGTT TCTCAAAAGC AGAAACATGC CGCCAGTTCT CAAGTTTTCC 4200 

TCCTAACTCC ATTTGAATGT AAGGGCAGCT GGCCCCCAAT GTGGGGAGGT CCGAACATTT 4260 

TCTGAATTCC CATTTTCTTG TTCGCGGCTA AATGACAGTT TCTGTCATTA CTTAGATTCC 4320 

GATCTTTCCC AAAGGTGTTG ATTTACAAAG AGGCCAGCTA AT AG CAG AAA TCATGACCCT 4380 

5 GAAAGAGAGA TGAAATTCAA GCTGTGAGCC AGGCAGGAGC TCAGTATGGC AAAGGTTCTT 4440 

GAGAATCAGC CATT TGGTAC AAAAAAGATT TTTAAAGCTT TTATGTTATA CCATGGAGCC 4500 

ATAGAAAGGC TATGGATTGT TTAAGAACTA TTTTAAAGTG TTCCAGACCC AAAAAGGAAA 4560 

AATAAAAAAA AAGGAATATT TGTACCCAAC AGCTAGAAGG ATTGCAAGGT AGATTTTTGT 4620 

TTTAAAATGG AGAGAAGTGG ACAGATAAGG C CAT T T AAT A TATCAAAGAT CAGTTGACAT 4680 
10 CTCCTAGGGA ATGATGAAAA CAGCAGGCTA T 

Seq ID NO: 18 Protein sequence: 
Protein Accession #: CAA53571 

15 1 11 21 31 41 51 

I I 1 I I 1 

MSSWIRWHGP AMARLWGFCW LWGFWRAAF ACPTSCKCSA SRIWCSDPSP GIVAFPRLEP 60 

NSVDPENITE IFIANQKRLE IINEDDVEAY VGLRNLTIVD SGIiKFVAHKA FLKNSNLQHI , 120 

NFTRNKLTSL SRKHFRHLDL SELILVGNPF TCSCDIMWIK TLQEAKSSPD TQDLYCLNES 180 

20 SKNIPLANLQ IPNCGLPSAN LAAPNLTVEE GKSITLSCSV AGDPVPNMYW DVGNLVSKHM 240 

NETSHTQGSL RITNISSDDS GKQISCVAEN LVGEDQDSVN LTVHFAPTIT FLESPTSDHH 300 

WCIPFTVKGN PKPALQWFYN GAILNESKYI CTKIHVTNHT EYHGCLQLDN PTHMNNGDYT 360 

h I AKNE YGKD EKQISAHFMG WPGIDDGANP NYPDVIYEDY GTAANDIGDT TNRSNEIPST 420 
DVTDKTGREH LSVYAWVIA SWGFCLLVM L FIiLKL ARH S KFGMKGFVLF HKIPLDG 

25 

Seq ID NO: 19 DNA sequence 
Nucleic Acid Accession #: NM_000228
Coding sequence: 82-3600 
30 1 11 21 31 41 51 

I I I I I I 

GCTTTCAGGC GATCTGGAGA AAGAACGGCA GAACACACAG CAAGGAAAGG TCCTTTCTGG 60 

GGATCACCCC ATTGGCTGAA GATGAGACCA TTCTTCCTCT TGTGTTTTGC CCTGCCTGGC 120 

CTCCTGCATG CCCAACAAGC CTGCTCCCGT GGGGCCTGCT ATCCACCTGT TGGGGACCTG 180 

35 CTTGTTGGGA GGACCCGGTT TCTCCGAGCT TCATCTACCT GTGGACTGAC CAAGCCTGAG 240 

ACCTACTGCA CCCAGTATGG CGAGTGGCAG ATGAAATGCT GCAAGTGTGA CTCCAGGCAG 300 

CCTCACAACT ACTACAGTCA CCGAGTAGAG AATGTGGCTT CATCCTCCGG CCCCATGCGC 360 

TGGTGGCAGT CCCAGAATGA TGTGAACCCT GTCTCTCTGC AGCTGGACCT GGACAGGAGA 420 

TTCCAGCTTC AAGAAGTCAT GATGGAGTTC CAGGGGCCCA TGCCCGCCGG CATGCTGATT 480 

40 GAGCGCTCCT CAGACTTCGG TAAGACCTGG CGAGTGTACC AGTACCTGGC TGCCGACTGC 540 

ACCTCCACCT TCCCTCGGGT CCGCCAGGGT CGGCCTCAGA GCTGGCAGGA TGTTCGGTGC 600 

CAGTCCCTGC CTCAGAGGCC TAATGCACGC CTAAATGGGG GGAAGGTCCA ACTTAACCTT 660 

ATGGATTTAG TGTCTGGGAT TCCAGCAACT CAAAGTCAAA AAATT CAAGA GGTGGGGGAG 720 

ATCACAAACT TGAGAGT CAA TTTCACCAGG CTGGCCCCTG TGCCCCAAAG GGGCTACCAC 780 

45 CCTCCCAGCG CCTACTATGC TGTGTCC CAG CTCCGTCTGC AGGGGAGCTG CTTCTGTCAC 840 

GGCCATGCTG ATCGCTGCGC ACCCAAGCCT GGGGCCTCTG CAGGCCCCTC CACCGCTGTG 900 

CAGGTCCACG ATGTCTGTGT CTGCCAGCAC AACACTGCCG GCCCAAATTG TGAGCGCTGT 960 

GCACCCTTCT ACAACAACCG GCCCTGGAGA CCGGCGGAGG GCCAGGACGC CCATGAATGC 1020 

CAAAGGTGCG ACTGCAATGG G C AC T CAGAG ACATGTCACT TTGACCCCGC TGTGTTTGCC 1080 

50 GCCAGCCAGG GGGCATATGG AGGTGTGTGT GACAATTGCC GGGACCACAC CGAAGGCAAG 1140 

AACTGTGAGC GGTGTCAGCT GCACTATTTC CGGAACCGGC GCCCGGGAGC TTCCATTCAG 1200 

GAGACCTGCA TCTCCTGCGA GTGTGATCCG GATGGGGCAG TGCCAGGGGC TCCCTGTGAC 1260 

CCAGTGACCG GGCAGTGTGT GTGCAAGGAG CATGTGCAGG GAGAGCGCTG TGACCTATGC 132 0 

AAGCCGGGCT TCACTGGACT CACCTACGCC AACCCGCAGG GCTGCCACCG CTGTGACTGC 13 80 

55 AACATCCTGG GGTCCCGGAG GGACATGCCG TGTGACGAGG AGAGTGGGCG CTGCCTTTGT 1440 

CTGCCCAACG TGGTGGGTCC CAAAT GTG AC CAGTGTGCTC CCTACCACTG GAAGCTGGCC 1500 

AGTGGCCAGG GCTGTGAACC GTGTGCCTGC GACCCGCACA ACTCCCCTCA GCCCACAGTG 1560 

CAACCAGTTC ACAGGGCAGT GCCCTGTCGG GAAGGCTTTG GTGGCCTGAT GTGCAGCGCT 1620 

GCAGCCATCC GCCAGTGTCC AGACCGGACC TATGGAGACG TGGCCACAGG ATGCCGAGCC 1680 

60 TGTGACTGTG ATTTCCGGGG AACAGAGGGC CCGGGCTGCG ACAAGGC AT C AGGCCGCTGC 1740 

CTCTGCCGCC CTGGCTTGAC CGGGCCCCGC TGTGACCAGT GCCAGCGAGG CTACTGCAAT 1800 

CGCTACCCGG TGTGCGTGGC CTGCCACCCT TGCTTCCAGA CCTATGATGC GGACCTCCGG 1860 

GAGCAGGCCC TGCGCTTTGG TAGACTCCGC AATGCCACCG CCAGCCTGTG GTCAGGGCCT 192 0 

GGGCTGGAGG ACCGTGGCCT GGCCTCCCGG AT CCTAGATG CAAAGAGTAA GATTGAGCAG 1980 

65 ATCCGAGCAG TTCTCAGCAG CCCCGCAGTC ACAGAGCAGG AGGTGGCTCA GGTGGCCAGT 2 040 

GCCATCCTCT CCCTCAGGCG AACTCTCCAG GGCCTGCAGC TGGATCTGCC CCTGGAGGAG 210 0 

GAGACGTTGT CCCTTCCGAG AGACCTGGAG AGTCTTGACA GAAGCTTCAA TGGTCTCCTT 2160 

ACTATGTATC AGAGGAAGAG GGAGCAGTTT GAAAAAATAA GCAGTGCTGA TCCTTCAGGA 222 0 

GCCTTCCGGA TGCTGAGCAC AGCCTACGAG CAGTCAGCCC AGGCTGCTCA GCAGGTCTCC 2280 

70 GACAGCTCGC GCCTTTTGGA CCAGCTCAGG GACAGCCGGA GAGAGGCAGA GAGGCTGGTG 2340 

CGGCAGGCGG GAGGAGGAGG AGGCACCGGC AGCCCCAAGC TTGTGGCCCT GAGGCTGGAG 2400 

ATGTCTTCGT TGCCTGACCT GACACCCACC TTCAACAAGC TCTGTGGCAA CTCCAGGCAG 2460 

ATGGCTTGCA CCCCAATATC ATGCCCTGGT GAGCTATGTC CC CAAGA CAA TGGCACAGCC 2520 

TGTGGCTCCC GCTGCAGGGG TGTCCTTCCC AGGGCCGGTG GGGCCTTCTT GATGGCGGGG 2580 

75 CAGGTGGCTG AGCAGCTGCG GGGCTTCAAT GCCCAGCTCC AGCGGACCAG GCAGATGATT 2640 

AGGGCAGCCG AGGAATCTGC CTCACAGATT CAATCCAGTG CCCAGCGCTT GGAGACCCAG 2700 

GTGAGCGCCA GCCGCTCCCA GATGGAGGAA GATGTCAGAC GCACACGGCT CCTAATCCAG 2760 

CAGGTCCGGG ACTTCCTAAC AGACCCCGAC ACTGATGCAG CCACTATCCA GGAGGT CAGC 2 820 

• GAGGCCGTGC TGGCCCTGTG GCTGCCCACA GACTCAGCTA CTGTTCTGCA GAAGATGAAT 2880 

80 GAGATCCAGG CCATTGCAGC CAGGCTCCCC AACGTGGACT TGGTGCTGTC CCAGACCAAG 2 940 

CAGGACATTG CGCGTGCCCG CCGGTTGCAG GCTGAGGCTG AGGAAGCCAG GAGCCGAGCC 3000 

CATGCAGTGG AGGGCCAGGT GGAAGATGTG GTTGGGAACC TGCGGCAGGG GACAGTGGCA 3060 

CTGCAGGAAG CTCAGGACAC CATGCAAGGC ACCAGCCGCT CCCTTCGGCT TATCCAGGAC 312 0 

AGGGTTGCTG AGGTTCAGCA GGTACTGCGG C CAG CAG AAA AGCTGGTGAC AAGCATGACC 3180 

85 AAGCAGCTGG GTGACTTCTG GACACGGATG GAGGAGCT CC GCCACCAAGC CCGGCAGCAG 3240 

GGGGCAGAGG CAGTCCAGGC CCAGCAGCTT GCGGAAGGTG CCAGCGAGCA GGCATTGAGT 3300 

GCCCAAGAGG GATTTGAGAG AATAAAACAA AAGTATGCTG AGTTGAAGGA CCGGTTGGGT 3360 



194 



10 



WO 02/086443 

CAGAGTTCCA TGCTGGGTGA 
GAGCTGTTTG GGGAGACCAT 
CTGCGGGGCA GCCAGGCCAT 
GTGGAGCAGA TCCGTGACCA 
TGCTACAGCT TCCAGCCCGT 
GATTGGGTTG GAATGCTTTC 
GACCACCCCT GGTGTGTAGC 
GGGACAGTTA CACTTGACAG 
CTCTCAAGTC AAGGAAGCTG 
GGAATCCTGG ACCAAGCACA 
AAAATCTTTG G 
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GCAGGGTGCC 
GGAGATGATG 
CATGCTGCGC 
CAT CAATGGG 
TGCCCCACTC 
CATCTCCAGG 
TAGTAAGATT 
ACAAAGATGG 
GGCTGGGCAG 
AAAACTTAAC 



CGGATCCAGA 
GACAGGATGA 
TCGGCGGACC 
CGCGTGCTCT 
ATCTGCCGCC 
AGACTTTCAT 
ACCCTGAGCT 
TGGAGATTGG 
TATCCCCCGC 
AAAAGTGATG 



GTGTGAAGAC 
AAGACATGGA 
TGACAGGACT 
ACTATGCCAC 
TTTGCTTTTG 
GCAGCCTAAA 
GCAGCTGAGC 
CATGCCATTG 
CTTTAGTTCT 
TAAAAATGAA 



AGAGGCAGAG 3420 

GTTGGAGCTG 3480 

GGAGAAGCGT 3540 

CTGCAAGTGA 3 600 

GTTGGGGGCA 3 660 

GTACAGCCTG 3720 

CTGAGCCAAT 3780 

AAACTAAGAG 3840 

CCACTGGGGA 3 900 

AAGCCAAATA 3 960 



15 



Seq ID NO: 20 Protein sequence: 
Protein Accession #: NP_000219



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



MRPFFLLCFA 
EWQMKCCKCD 
MEFQGPMPAG 
NARLNGGKVQ 
VSQLRLQGSC 
PWRPAEGQDA 
HYFRNRRPGA 
TYANPQGCHR 
CACDPHNSPQ 
TEGPGCDKAS 
RLRNATASLW 
TLQGLQLDLP 
AYEQSAQAAQ 
TPTFNKLCGN 
GFNAQLQRTR 
DPDTDAAT I Q 
RLQAEAEEAR 
VLRPAEKLVT 
IKQKYAELKD 
MLRSADLTGL 



11 

LPGLLHAQQA 
SRQPHNYYSH 
MLIERSSDFG 
LNLMDLVSGI 
F CHGHADR C A 
HE CQRCDCNG 
SIQETCISCE 
CDCNILGSRR 
PTVQPVHRAV 
GRCLCRPGLT 
SGPGLEDRGL 
LEEETLSLPR 
QVSDSSRLLD 
SRQMACTPIS 
QMIRAAEESA 
EVSEAVLALW 
SRAHAVEGQV 
SMTKQLGDFW 
RLGQSSMLGE 
EKRVEQIRDH 



21 



CSRGACYPPV 
RVENVASSSG 
KTWRVYQYLA 
PATQSQKIQE 
PKPGASAGPS 
HSETCHFDPA 
CDPDGAVPGA 
DMPCDEESGR 
PCREGFGGLM 
GPRCDQCQRG 
ASRILDAKSK 
DLESLDRSFN 
QLRDSRREAE 
CPGELCPQDN 
SQIQSSAQRL 
LPTDSATVLQ 
EDWGNLRQG 
TRMEELRHQA 
QGARIQSVKT 
I NGRVLY YAT 



31 
I 

GDLLVGRTRF 
PMRWWQSQND 
ADCTSTFPRV 
VGE I TNLRVN 
TAVQVHDVCV 
VFAASQGAYG 
PCDPVTGQCV 
CLCLPNWGP 
CSAAAIRQCP 
YCNRYPVCVA 
IEQIRAVLSS 
GLLTMYQRKR 
RLVRQAGGGG 
GTACGSRCRG 
ETQVSASRSQ 
KMNEIQAIAA 
TVALQEAQDT 
RQQGAEAVQA 
EAEELFGETM 
CK 



41 
I 

LRASSTCGLT 
VNPVSLQLDL 
RQGRFQSWQD 
FTRLAPVPQR 
CQHNTAGPNC 
GVCDNCRDHT 
CKEHVQGERC 
KCDQ CAP YHW 
DRTYGDVATG 
CHPCFQTYDA 
PAVTEQEVAQ 
EQFEKISSAD 
GTGSPKLVAL 
VLPRAGGAFL 
MEEDVRRTRL 
RLPNVDLVLS 
MQGTSRSLRL 
QQLAEGASEQ 
EMMDRMKDME 



51 
I 

KPETYCTQYG 
DRRFQLQEVM 
VRCQSLPQRP 
GYHPPSAYYA 
ERCAPFYNNR 
EGKNCERCQL 
DLCKPGFTGIi 
KLASGQGCEP 
CRACD CDFRG 
DLREQALRFG 
VASAILSLRR 
PSGAFRMLST 
RLEMSSLPDL 
MAGQVAEQLR 
LIQQVRDFLT 
QTKQDIARAR 
IQDRVAEVQQ 
ALSAQEGFER 
LELLRGSQAI 



Seq ID NO: 21 DNA sequence 

Nucleic Acid Accession #: NM_003722

Coding sequence: 145-1491 



85 



i 
I 

TCGTTGATAT 
ACAGTACTGC 
AAAGAAAGTT 
CCAGAGGT TT 
ATTGACTTGA 
AGCATGGACT 
ACGAACCTGG 
AGTCCCTATA 
CCCAGCTCCA 
CCAGGCCCGC 
TGGACGTATT 
CAGATCAAGG 
AAAAAAGCTG 
GAATTCAACG 
CATGCCCAGT 
CCACCCCAGG 
TGTGTTGGAG 
GGGCAAGTCC 
AGGAAGGCGG 
GATGGTACGA 
AAACGAAGAT 
GAAATGCTGT 
ATTGAAACGT 
CTTTCAGCCT 
GACGTCTTCT 
TCTATATTTT 
TGTGTGTGCG 
CCCAACTGCT 
TTACAAGAAA 
GAACCACTGT 
GAAAGGGGCA 
AATTCACAGG 
AAAAAAGTTG 
CCCTTTTAAT 
TACTGCTGGG 
TTTGTGAGAA 
GCTGTGTACC 
CATGAAACCC 
CTCATTTTGT 
TGTTTACCAT 
AATTTGCTTA 
CTGATACTGT 
AGACGTGT TA 



11 
I 

CAAAGACAGT 
CCTGACCCTT 
AT T ACCG AT C 
TCCAGCATAT 
ACTTTGTGGA 
GTATCCGCAT 
GGCTCCTGAA 
ACACAGACCA 
CCTTCGATGC 
ACAGTTT CG A 
CCACTGAACT 
TGATGACCCC 
AGCACGTCAC 
AGGGACAGAT 
ATGTAGAAGA 
TTGGCACTGA 
GGATGAACCG 
TGGGCCGACG 
ATGAAGATAG 
AGCGCCCGTT 
CCCCAGATGA 
TGAAGAT CAA 
ACAGGCAACA 
GCTTCAGGAA 
TTAGACATTC 
AAGTGTGTGT 
TGTGTATCTA 
CAAAGGCACA 
GGATGTTTTC 
GTTTGTCTGT 
TTAAGATGTT 
GAAGCTTTTG 
TTATTGTCTG 
GCTGGTCATG 
CAGCGAGGTG 
CTTGCATTAT 
TGCCTCTGCC 
TGGAAGACCT 
GCTTTTAATA 
TATTCAAAGC 
ATTAGAGCTT 
TCAGTGCATT 
AAATCAGCAC 



21 

I 

TGAAGGAAAT 
ACATCCAGCG 
CACCATGTCC 
CTGGGATTTT 
TGAACCATCA 
GCAGGACTCG 
CAGCATGGAC 
CGCGCAGAAC 
TCTCTCTCCA 
CGTGTCCTTC 
GAAGAAACTC 
ACCTCCTCAG 
GGAGGTGGTG 
TGCCCCTCCT 
TCCCATCACA 
ATTCACGACA 
CCGTCCAATT 
CTGCTTTGAG 
CATCAGAAAG 
TCGT CAGAAC 
TGAACTGTTA 
AGAGTCCCTG 
GCAACAGCAG 
TGAGCTTGTG 
CAAGCCCCCA 
GTTGTATTTC 
GCCCTCATAA 
AAGCCACTAG 
TGCAGATTTT 
GAGCTTTCTG 
TATTGGAACC 
AGCAGGTCTC 
TG CATAAGT A 
TAATAATATT 
ATCATTACCA 
TTGTGTCCTC 
ACTGTATGTT 
ACTACAAAAA 
GAAAGACAAA 
TCAAAATAGA 
CTATCCCTCA 
TAGCCAGGAG 
TCCTGGACTG 



31 
t 

GAATTTTGAA 
TTTCGTAGAA 
CAGAGCACAC 
CTGGAACAGC 
GAAGATGGTG 
GACCTGAGTG 
CAGCAGATT C 
AGCGTCACGG 
TCACCCGCCA 
CAGCAGTCGA 
TACTGCCAAA 
GGAGCTGTTA 
AAGCGGTGCC 
AGTCATTTGA 
GGAAGACAGA 
GTCTTGTACA 
TTAATCATTG 
GCCCGGATCT 
CAGCAAGTTT 
ACACATGGTA 
TACTTACCAG 
GAACTCATGC 
CAGCACCAGC 
GAGCCCCGGA 
AACCGATCAG 
CATGTGTATA 
ACAGGACTTG 
TGAGAGAATC 
GTATCCTTAG 
TTGTTTCCTG 
CTTTTCTGTC 
AAACTTAAGA 
AGTTGTAGGT 
G CAAGTAGTA 
AAAGTAAT C A 
CCCTCATGTG 
GGCATCTGTT 
AACTGTTGTT 
TCCACCCCAG 
ATTTGAAGCC 
AGCCTACCTA 
ACTTACGTTT 
GAAATTAAAG 



41 
1 

ACTTCACGGT 
ACCCAGCTCA 
AGACAAATGA 
CTATATGTTC 
CGACAAACAA 
ACCCCATGTG 
AGAACGGCTC 
CGCCCTCGCC 
TCCCCTCCAA 
GCACCGCCAA 
TTGCAAAGAC 
TCCGCGCCAT 
CCAACCATGA 
TTCGAGTAGA 
GTGTGCTGGT 
ATTTCATGTG 
TTACTCTGGA 
GTGCTTGCCC 
CGGACAGTAC 
TCCAGATGAC 
TGAGGGGCCG 
AGTACCTTCC 
ACTTACTTCA 
GAGAAACTCC 
TGTACCCATA 
TGTGAGTGTG 
AAGACACTTT 
TTTTGAAGGG 
ACCGGCCATT 
GGAGGGAGGG 
TTCTTCTGTT 
TGTCTT T TT A 
GACTGAGAGA 
AGAAACGAAG 
ACTTTGTGGG 
TAGGTAGAAC 
ATGCTAAAGT 
TGGCCCCCAT 
TAATATTGCC 
CTCTCACAAA 
CCATAAAACC 
TGAGTAAGTG 
ATTGAAAGGG 



51 
I 

GTGCCACCCT 
TTTCTCTTGG 
ATTCCTCAGT 
AGTTCAGCCC 
GATTGAGATT 
GCCACAGTAC 
CTCGTCCACC 
CTACGCACAG 
CACCGACTAC 
GTCGGCCACC 
ATGCCCCATC 
GCCTGTCTAC 
GCTGAGCCGT 
GGGGAACAGC 
ACCTTATGAG 
TAACAGCAGT 
AACCAGAGAT 
AGGAAGAGAC 
AAAGAACGGT 
ATCCAT CAAG 
TGAGACTTAT 
TCAGCACACA 
GAAACATCTC 
AAAACAATCT 
GAGCCCTATC 
TGTGTGTGTA 
GGCT CAGAGA 
ACTCAAACCT 
GGTGGGTGAG 
GTCAGGTGGG 
GTTTTTCTAA 
AGAAAAGGAG 
CTCAGTCAGA 
GTGTCAAGTG 
TGGAGAGTTC 
ATTTCTTAAT 
TTTTCTTGTA 
AGCAGGTGAA 
CTTACGTAGT 
ATCTGTGATT 
AGCCATATTA 
AGATCCAAGC 
TAGACTACTT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 



195 



WO 02/086443 

TTCTTTTTTT TACTCAAAAG TTTAGAGAAT CTCTGTTTCT TTCCATTTTA AAAACATATT 2 640 

TTAAGATAAT AGCATAAAGA CTTTAAAAAT GTTCCTCCCC TCCATCTTCC CACACCCAGT 2 700 

CACCAGCACT GTATTTTCTG TCACCAAGAC AATGATTTCT TGTTATTGAG GCTGTTGCTT 2760 
TTGTGGATGT GTGATT TTAA TTTTCAATAA ACTTTTGCAT CTTGGTTTAA AAGAAA 



PCT/US02/12476 



Seq ID NO: 22 Protein sequence: 
Protein Accession #: NP_003713
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MSQSTQTNEF 
DSDLSDPMWP 
SPSPAIPSNT 
PQGAVIRAMP 
ITGRQSVLVP 
FEARICACPG 
LLYLPVRGRE 
LVEPRRETPK 



11 
I 

LSPEVFQHIW 
QYTNLGLLNS 
DYPGPHSFDV 
VYKKAEHVTE 
YEPPQVGTEF 
RDRKADEDSI 
TYEMLLKIKE 
QSDVFFRHSK 



21 

1 

DFLEQPICSV 
MDQQIQNGSS 
SFQQSSTAKS 
WKRCPNHEL 
TTVLYNFMCN 
RKQQVSDSTK 
SLELMQYLPQ 
PPNRSVYP 



31 
I 

QPIDLNFVDE 
STSPYNTDHA 
ATWTYSTELK 
SREFNEGQIA 
SSCVGGMNRR 
NGDGTKRPFR 
HTIETYRQQQ 



41 



PSEDGATNKI 
QNSVTAPSPY 
KLYCQIAKTC 
PPSHLIRVEG 
PILIIVTLET 
QNTHGIQMTS 
QQQHQHLLQK 



51 

I 

EISMDCIRMQ 
AQPSSTFDAL 
PIQIKVMTPP 
NSHAQYVEDP 
RDGQVLGRRC 
IKKRRSPDDE 
HLLSACFRNE 



Seq ID NO: 2 3 DNA sequence 

Nucleic Acid Accession #: NM_001944.1 

Coding sequence: 84-3083 



80 



TTTTCTTAGA 
TTT CACCAGG 
CCATCTTCGT 
ATGATGAAGA 
AATTTGCCAA 
T T AC T T C AG A 
ATCAGCCGCC 
CTATAGTCGA 
AAGGACTAGA 
ATCCTCCAGT 
ACTCACTGGT 
AAATTGCCTT 
G AAACACTG G 
ATCGTCTGGT 
GTAATATTAA 
CAG CACGT AT 
TGGATGAAGA 
GAAATTGGTT 
AGGCTCTAGA 
CTGAATTTCA 
AGGTAATAAA 
AAAAAGG CAT 
ATGAGGACAC 
GATACCTAAT 
ATTCTACTTT 
CGGGTAAAAC 
CAACAGCTGT 
CTAGAACACT 
TAAAGTTGCC 
CCCAGGAACA 
ACAATCGGTG 
GCATCTGTGG 
CAGGGAGGCT 
TGGCCCCCCT 
GTGGTTTTAT 
GAGCCCATCC 
GAGCCGATTT 
TGGAAGGCAC 
GTGCTGCAGG 
CTGGAGTTGG 
GAGGAACCAA 
TTTCTCAGAA 
TGTTGATCTA 
GTTGCAGTTT 
TTAAAAAACT 
CCTCTAAAGA 
CAGGATTTGT 
CTGGGTCTGT 
TAACGGAGAC 
CACTTCTCAC 
CTGG CAACCT 
ATCCTTGCTC 
ATCTTTGGAC 
TGGCACTTAT 
TACCCCAAAA 
TCTTAAAGTT 



11 

I 

CATTAACTGC 
G AAAT CAG AG 
GGTGGTCATA 
AGAGATGACT 
ACCCTG CAG A 
TTACCAAGCA 
TTTTGGAATC 
CCGGGAGGAA 
TGTAGAGAAA 
ATTTT CACAA 
GATGATACTA 
CAAAATTGTC 
GGAAGTCCGT 
TGTGAGTGGT 
AGTGAAAGAT 
TGAAGAAAAT 
GTACACAGAT 
TGAAATACAA 
TTATGAACAA 
CCAATCAGTT 
TGTAAGAGAA 
AAGTAGCAAA 
TAACAAAGCT 
GATTGATT C A 
CATAGTTAAC 
TTCTACAGGC 
CCTCGAAAAA 
GAATAATAGA 
TGCCGTATGG 
GATACCTCCT 
TGAGATGCCA 
AACTTCTTAC 
GGGGCCTGCC 
TCTGCTGTTG 
CCCAGTTCCT 
TGAAGACAAG 
CATGGAAAGT 
TTCAGGAATG 
CTTTGCAACA 
CATCTGTTCC 
TAAGGACTAC 
AGCATTTGCC 
TGATAATGAA 
TATTGCTGAT 
TGCAGAGATA 
CAGCGGTTAT 
TAAGTGCCAG 
CCAGCCAGCT 
TTACTCGGCT 
ACAAAATGTG 
AGCTGGCCCA 
CCGTCTAATA 
TAAAGTAT T C 
TAGCTTCTCT 
GCAATATGTT 
TTTCAAAACC 



21 

i 

AGACGGCTGG 
ACAATGATGG 
TTGGTTCATG 
ATGCAACAAG 
GAAGGAGAAG 
ACCCAGAAAA 
TTTGTTGTTG 
ACTCCAAGCT 
CCACTTATAC 
CAAATTTTCA 
AATGCCACAG 
T CT CAGGAAC 
ACTTTGACCA 
GCAGACAAAG 
GTCAACGATA 
ATTTTAAGTT 
AATTGGCTTG 
ACTGATCCTA 
CTACAAAGCG 
AT CTCT CGAT 
GGAATTGCAT 
AAATTGGTGG 
GCCTCAAATG 
AAAACTGCTG 
AAAACAATCA 
ACGGTATATG 
GATGCAGTTT 
TACACTGGCC 
AGT AT CACAA 
GGAGTATACC 
CGCAGCTTGA 
CCAACCACAA 
GCCATCGGCC 
ACCTGTGACT 
GATGGCTCAG 
GAAATCACAA 
TCTGAAGTTT 
GAAATGACCA 
GGGACAGTGT 
TCAGGGCAGT 
GCTGATGGGG 
TGTGCGGAGG 
GGCGCAGATG 
GACCTGGATG 
AGCCTTGGTG 
GGGATTGAAT 
ACTTTGTCAG 
GTTTCCATCC 
TCTGGTTCCC 
ATAGTGACAG 
ACGCAGCTAC 
TGACCAGAAT 
AAAATAGCAT 
CATAAACTGA 
GTCACTCCTA 
CTAAAATCAT 



31 

I 

CAGGATAGAA 
GGCTCTTCCC 
GAGAATTGCG 
CTAAAAGAAG 
ATAACTCAAA 
TCACCTACCG 
ACAAAAACAC 
TCCTGATCAC 
TAACGGTTAA 
TGGGTGAAAT 
ATGCAGATGA 
CAGCAGGCAC 
ATTCTCTTGA 
ATGGAGAAGG 
ACTTCCCAAT 
CTGAATTACT 
CAGTAT ATT T 
GAACTAATGA 
TGAAACTTAG 
ACCGAGTTCA 
TCCGTCCTGC 
ATTATATCCT 
TCAAATATGT 
AAATCAAATT 
CAGCTGAGGT 
TTAGAGTACC 
GCAGTTCTTC 
CCTATACATT 
CCCTCAATGC 
ACATCTCCCT 
CACTGGAAGT 
GCCCTGGGAC 
TGCTGCTCCT 
GTGGGGCAGG 
AAGGAACAAT 
ATATTTGTGT 
GTACAAATAC 
CTAAGCTTGG 
CAGGAGCTGC 
CTGGAACCAT 
CGATAAGCAT 
AAGACGATGG 
CCACTGGTTC 
ACAGCTTCTT 
TTGATGGTGA 
CCTGTGGCCA 
GAAGT CAAGG 
CTGACCCTCT 
TCGTGCAACC 
AAAGGGTGAT 
GAGGGTCACA 
GAGCTGGAAT 
AGCAAAGCTC 
TCACGATTAT 
ATTCTCAAGT 
ATTCGC 



41 
I 

GCAGCGGCTC 
CAGAACTACA 
AATAGAGACT 
GCAAAAACGT 
AAGAAACCCA 
AATCTCTGGA 
TGGAGATATT 
ATGTCGGGCT 
AATTTTGGAT 
TGAAGAAAAT 
ACCAAACCAC 
ACCCATGTTC 
CCGAGAGCAA 
ACTATCAACT 
GTTTAGAGAC 
TCGATTTCAA 
CTTTACCTCT 
AGGCATCCTG 
TATTGCTGTC 
GTCAACCCCA 
TTCCAAGACA 
GGGAACATAT 
CATGGGACGT 
TGTCAAAAAT 
TCTGGCCATA 
CGATTTCAAT 
ACCTTCCGTG 
TGCACTGGAA 
TACCTCGGCC 
GGTACTTACA 
CTGTCAGTGT 
CAGGTATGGC 
TGGTCTCCTG 
TTCTACTGGG 
TCATCAGTGG 
GCCTCCTGTA 
GTATGCCAGA 
AGCAGCCACT 
TTCAGGATTC 
GAGAACAAGG 
GAATTTTCTG 
CCAGGAAGCA 
TCCTGTGGGC 
GGACTCACTT 
AGGCAAAGAA 
TCCCATAGAA 
AGCTTCTGCT 
GCAGCATGGT 
TTCCACTGCA 
CTGTCCCATT 
TACTATGCTC 
ACCACACTGA 
ACTGTATTGG 
AAATTAAATG 
ACTATTCAAA 



51 
I 

ACTTGGACTT 
GGGGCTCTGG 
AAAGGT CAAT 
GAATGGGTGA 
ATTGCCAAGA 
GTGGGAATCG 
AACATAACAG 
CTAAATGCCC 
ATTAATGATA 
AGTGCCTCAA 
TTGAATTCTA 
CTCCTAAGCA 
GCTAGCAGCT 
CAATGTGAAT 
TCTCAGTATT 
GTAACAGATT 
GGGAATGAAG 
AAAGTGGTGA 
AAAAACAAAG 
GTCACAATT C 
TTTACTGTGC 
CAAGCCATCG 
AACGATGGTG 
ATGAACCGAG 
GATGAATACA 
GACAATTGTC 
GTTGTCTCCG 
GATCAACCTG 
CTCCTCAGAG 
GAC AGT CAG A 
GACAACAGGG 
AGGCCGCACT 
CTGCTGCTGT 
GGAGTGACAG 
GGAATTGAAG 
ACAGCCAATG 
GGCACAGCGG 
GAATCTGGAG 
GGAGCAGCCA 
CATTCCACTG 
GACTCCTACT 
AATGACTGCT 
TCCGTGGGTT 
GGACCCAAAT 
GTTCAGCCAC 
GTCCAGCAGA 
TTGTCCGCCT 
AACTATTTAG 
GGCTTTGATC 
TCCAGTGTTC 
TGTACAGAGG 
CCAAATCTGG 
GCTAATAATT 
TTTGGGTTCA 
TTGTAGTAAA 



60 
120 
180 
240 
300 
360 
420 



60 
120 
180 
240 
300 
360 
42 0 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 



85 



Seq ID NO: 24 Protein sequence: 
Protein Accession #: NP 001935.1 



11 



21 



31 



41 



51 



196 



WO 02/086443 



PCT/US02/12476 



I 



10 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



MMGLFPRTTG 
GEDNSKRNPI 
PSFLITCRAL 
ATDADEPNHL 
DKDGEGLSTQ 
WLAVYFFTSG 
SRYRVQSTPV 
SNVKYVMGRN 
VYVRVPD FND 
I TTLNATSAL 
TTSPGTRYGR 
GSEGTIHQWG 
MTTKLGAATE 
DGAISMNFLD 
LDDSFLDSLG 
LSGSQGASAL 
VTERVICPIS 



ALAIFWVIL 
AKITSDYQAT 
NAQGLDVEKP 
NSKIAFKIVS 
CECNIKVKDV 
NEGNWFE I QT 
TIQVINVREG 
DGGYLMIDSK 
NCPTAVLEKD 
LRAQEQIPPG 
PHSGRLGPAA 
IEGAHPEDKE 
SGGAAGFATG 
SYFSQKAFAC 
PKFKKLAEIS 
SASGSVQPAV 
SVPGNLAGPT 



VHGEIiRIETK 
QKITYRISGV 
LILTVKILDI 
QEPAGTPMFL 
NDNFPMFRDS 
DPRTNEG ILK 
IAFRPASKTF 
TAEIKFVKNM 
AVCSSSPSW 
VYHISLVLTD 
IGLLLLGLLL 
ITNICVPPVT 
TVSGAASGFG 
AEEDD GQEAN 
LGVDGEGKEV 
SIPDPLQHGN 
QLRGSHTMLC 



i 

GQYDEEEMTM 
GIDQPPFGIF 
NDNPPVFSQQ 
LSRNTGEVRT 
QYSARIEENI 
WKALDYEQL 
TVQKGISSKK 
NRDSTFIVNK 
VSARTLNNRY 
SQNNRCEMPR 
LLLAPLLLLT 
ANGADFMESS 
AATGVGICSS 
DCLLIYDNEG 
QPPSKDSGYG 
YLVTETYSAS 
TEDPCSRLI 



QQAKRRQKRE 
WDKNTGDIN 
IFMGEIEENS 
LTNSLDREQA 
LSSELLRFQV 
QSVKLSIAVK 
LVDYILGTYQ 
TITAEVLAID 
TGPYTFALED 
SLTLEVCQCD 
CDCGAGSTGG 
EVCTNTYARG 
GQSGTMRTRH 
ADATGSPVGS 
IESCGHPIEV 
GSLVQPSTAG 



WVKFAKPCRE 
ITAIVDREET 
ASNSLVMILN 
SSYRLWSGA 
TDLDEEYTDN 
NKAEFHQSVI 
AIDEDTNKAA 
EYTGKTSTGT 
QPVKLPAVWS 
NRGICGTSYP 
VTGGFIPVPD 
TAVEGTSGME 
STGGTNKDYA 
VGCCSFIADD 
QQTGFVKCQT 
FDPLLTQNVI 



Seq ID NO: 25 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 56-1642 



75 



AGTATCCCAG 
GCAAGGGATC 
CATGTTTGAG 
CTGCTCTGTC 
GGAGAAGGTG 
GGAAGATCAG 
GGACTCTTTT 
CTTTTCCCAG 
GGAGATGGTA 
TAACTCAGGG 
GTCCCTGGCG 
GCCCTTGCTC 
GAAGAAGCTG 
GAGGAGTGTC 
TGGGCTCTCT 
ATGGGCACAG 
GATCT CATTC 
ACAGCGCAAG 
AGATCTCAAC 
TCGTAAGAAC 
CATCTTCTCA 
CGAGCTGTCA 
ACGGTTGAAG 
TGCCCTTCGT 
CAAGT TGACT 
CAATGTGAAT 
CATTGCTAGC 
ACTCGTTCAT 
CAGACACAGG 
AGGAGCTCCT 
AGCTACAGCT 
AACAGCGGGA 
TGTATGAAGA 
TTCAGGAGCG 
AGTCAGTGGC 
CAGCTTCTGC 
CAGAGCTAAA 
CCTCAGCCAA 
TAAGGCTGTT 
CTTGTTGCCA 
TCTTAATCAA 
TGGACCTTCG 
AAGGCCAGGT 
AACAACCACC 
AAAGCTCAAC 
TCAAATCTGG 
GGCCCTGAGG 
TAT CAGGAAT 
TATAACCACC 
GCACACAAAA 
GTAGCAAAAT 



11 
I 

GAGGAGCAAG 
CTTTCTCCGC 
TCCACAGCTG 
GTGTCTACCT 
AAAGTATACT 
GGTTGTGTCC 
GCCCTGAAGA 
ATCTTTGGGC 
AAGGATGTAC 
AAAACCCACA 
CTGATCTTCA 
TCCAATGAGG 
TCCCTGCTAA 
TACAT CGAAA 
TCTATCAGTC 
CCAGACACTG 
TTTGAGATCT 
AGGCAGACTT 
TGGATT CATG 
CAGAGCTTTG 
AT CAGGATCC 
CTCTGTGATC 
GAAGCAGGAA 
CAAAACCAGC 
CGAGTGTTCC 
CCCTGTGCAT 
CAGGTGACTT 
CAAGGAACAT 
CCTTGATGAT 
ACAAGTTGTG 
GGAGATGCAT 
ACAGTGGTGC 
AAAACTAAAT 
GGATGAAAAG 
CCATCAGCAA 
CTCCACCCAG 
CTCTACCACT 
GCCCTTCACC 
GCGGACAGAG 
CAGCACTGGG 
ACAGGACCAG 
GAAGAAGGCA 
TTCTGCCAAA 
AGGGAAGAAA 
AGACTGCAGC 
GCCTTTTGGC 
TGGGTCAGCT 
TATATCCAGG 
TATGTAATCT 
ACAGTTATAT 
CATTAAAACA 



21 



TGGCACGTCT 
CAGCGGGCTT 
CAGATTTGGG 
CCCTAGAGGA 
TGAGGGTTAG 
GTATTGAGAA 
GCAATGAACG 
CAGAAGTGGG 
TCAAAGGGCA 
CGATTCAAGG 
ATAGCCTCCA 
TAATCTGGCT 
ATGGAGGCCT 
GTCGGATAGG 
AGTGTACCAG 
CCCCACTACC 
ACAACGAACT 
TGCGGCTATG 
TGCAAGATGC 
CCAGCACCCA 
TACACCTTCA 
TGGCTGGCTC 
ACATTAACAC 
AGAACCGGTC 
AAGGTTTCTT 
CTACCTATGA 
GTGCATGCCC 
AGTCTTCAGG 
GATATTGAAA 
GAAGCCATGA 
CTCCGAGATG 
AGTGAACATT 
ATCCTCAAGG 
ATTGAAGAGC 
TCAGGGTCTG 
CAGCTTCAGG 
GAAGAGTTGC 
ATTGATGTGG 
CTTCAGAAAC 
GCAGGAAAAC 
ACTCTGGCTG 
GCATGTATTG 
AAGCGCCTTG 
CCATTCCTTC 
CCTTATGCCC 
AAAAAGTACT 
ACTCTCCTGA 
ATGCAATACT 
CATGTTGTTG 
TAAAGATATT 
AATTATAAAA 



31 
I 

TCGGACCTAG 
GCTGTCCGAT 
GT CTGTGGT A 
CAAGCAGCAG 
GCCCTTGTTA 
TGTGGAGACC 
GGGAATTGGC 
ACAGGCATCC 
GAACTGGCTC 
TACCATCAAG 
AGGCCAACTT 
AGACAGCAAG 
CCAAGAGGAG 
TACCAGCACC 
CAGTAGCCAG 
TGTCCCGGCA 
GCTTTATGAC 
CGAGGATCAA 
TGAGGAGGCC 
CCTCAACCAG 
GGGGGAAGGA 
AGAGCGCTGC 
CTCTCTACAC 
AAAGCAGAAC 
CACAGGCCGA 
TGAAACTCTT 
CACCTATGCA 
TATCCCCCAG 
ATGAAGCTGA 
AGACACTGCT 
AAATTTGCAA 
TGGACACCCA 
AGTCACTGAC 
TAG AAGCT CT 
AATTGGCCCT 
AGGTTAAAGC 
ATAAGTATCA 
ACAAGAAGTT 
TTGGTGAGTC 
TTCGTCAAGC 
AACTGCAGAA 
CTGAGCAGTA 
GTACCAACCA 
GAAATTTACT 
GG AT CCTACG 
AAGGCTGTGG 
AGAAATAGGT 
CAGACACTAG 
TTTTTTTTTA 
ATTGTTCACA 
GGGACAGAAA 



41 
I 

GCTGCCCCTG 
GACGATGTCG 
CGCAAGAACC 
GTTCCATCTG 
CCTTCAGAGT 
CTTGTTCTAC 
CAAGCCACAC 
TTCTTCAACC 
ATCTATACAT 
GATGGAGGGA 
CATCCAACAC 
CAGAT CCGAC 
GAGCTGTCCA 
AGCTTCGACA 
CTGGATGAAA 
AACATTCGCT 
CTATTAGAAC 
AATGGCAATC 
TGGAAGCTCC 
AACTCCAGCC 
GATATAGTCC 
AAAGATCAGA 
ACCCTGGGCC 
CTGGTTCCCT 
GGCCGTTCCT 
CATGTGGCCA 
ACTGGGATTC 
CTTAGAGAAA 
CATCTCCATG 
TTTGAAGGAA 
TGAGATGGTA 
AAAGGAACTA 
AAGTTTTTAC 
CTTGCAGGAA 
ACGGCGGTCA 
TAAATTACAG 
GAAAATGTTA 
AGAAGAGGGC 
TCTCCAATCA 
CTTGACCACT 
CAACATGGTG 
TCATACTGTG 
GGAAAATCAG 
TCCCCGAACA 
CTCACGGCGT 
GGAAAGAGAA 
CTCTTTTATG 
CTTTTTTCTC 
TTTACTTATA 
TTTTTTATTG 
AA 



51 
1 

CCGTCATGTC 
TAGTTTCTCC 
TGCTATCAGA 
AGGACAGTAT 
TGGAACGACA 
AAGCACCCAA 
ACAGGTTCAC 
TAACTGTGAA 
ATGGAGT CAC 
TTCTCCCCCG 
CTGAT CTGAA 
AGGAGGAAAT 
CTTCCTTGAA 
GTGGCATTGC 
CAAGT CAT CG 
TCTCCATCTG 
CGCCTAGCCA 
CCTATGTGAA 
TAAAAGTGGG 
GCAGT CACAG 
CCAAGATCAG 
AGAGTGGTGA 
GCTGTATTGC 
TCCGTGACAG 
GCATGATTGT 
AGTTCTCAGC 
CCATCCCTGC 
GGGGCTAAGG 
TATGG CAAAG 
CGACAGGAAA 
GAACAGATGC 
TTGGAGGAAA 
CAAGAAGAGA 
GCCAGACAAC 
CAAAGGTTGG 
CAGTGCAAAG 
GAACCACCAC 
CAGAAGAATA 
GCAGAGAGAG 
TGTGATGACA 
CTAGTGAAAC 
TTGAAACTCC 
CAACCAAACC 
CCAACCTGCC 
TCCCCTTTAC 
GAGCAGTCAT 
CTTTACCATA 
ACTTTTGTAT 
TGATTTCTAT 
AATTCCAAAT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 



80 



85 



Seq ID NO: 26 Protein sequence: 
Protein Accession # : Eos sequence 



MSQGILSPPA 
SMEKVKVYLR 
FTFSQIFGPE 
PRSLALIFNS 
LKRSVYIESR 



11 
I 

GLLSDDDWV 
VRPLLPSELE 
VGQASFFNLT 
LQGQLHPTPD 
IGTSTSFDSG 



21 



SPMFESTAAD 
RQEDQGCVRI 
VKEMVKDVLK 
LKPLLSNEVI 
IAGLSSISQC 



31 
I 

LGSWRKNLL 
ENVETIiVLQA 
GQNWLIYTYG 
WLDSKQIRQE 
TSSSQLDETS 



41 
I 

SDCSWSTSL 
PKDSFALKSN 
VTNSGKTHTI 
EMKKLSLLNG 
HRWAQPDTAP 



51 



EDKQQVPSED 60 

ERGIGQATHR 120 

QGTIKDGGIL 180 

GLQEEELSTS 240 

LPVPANIRFS 30 0 



197 



WO 02/086443 

IWISFFEIYN ELLYDLIiEPP SQQRKRQTLR LCEDQNGNPY VKDLNWIHVQ DAEEAWKLLK 3 60 
VGRKNQSFAS THLNQNSSRS HSIFSIRILH LQGEGDIVPK ISELSLCDLA GSERCKDQKS 420 
GERLKE AGN I NTSLHTLGRC IAALRQNQQN RSKQNLVPFR DSKLTRVFQG FFTGRGRSCM 480 
IVNVNPCAST YDETLHVAKF SAIASQVTCA CPTYATGIPI PALVHQGT 



PCT/US02/12476 



Seq ID NO: 27 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 13-1424 



10 



15 



20 



25 



30 



35 



40 



TAGAAGTTTA 
CTTCCCCTGA 
TTAGAAAAAT 
GGAAACTTAA 
GGGCAACTGG 
GTCCATCATT 
AGAATCAATA 
GCTTTCCAAG 
GCTGACATTT 
AAAGGTGGAA 
TTCGATGAGG 
GTTCACGAGA 
TTCCCCACCT 
GGCATTCAGT 
TCAGAACCAG 
AAGATCTTTT 
AGTGTTAATT 
GAAATTGAAG 
AATTTAAGAC 
GTGAAAAAAA 
GATAACCAGT 
CTGATTACCA 
AACAAATACT 
CGTATCACCA 
TGGTTTTTGT 
GTGTACCACT 
TTATATAAAA 
CTCTACTATT 
CTCTGTAAGT 
TAAAATTAAG 



11 
I 

CAATGAAGTT 
ACAGCTCTAC 
TTTATGGCCT 
TGAAGGAAAA 
ACACATCTAC 
TCAGGGAAAT 
ATTACACACC 
TATGGAGTAA 
TGGTGGTTTT 
TCCTAGCCCA 
ACGAATTCTG 
TTGGCCATTC 
ACAAATATGT 
CCCTGTATGG 
CTCTCTGTGA 
TCTTCAAAGA 
TAATTTCTTC 
CCAGAAATCA 
CAGAGCCAAA 
TTGATGCAGC 
ATTGGAGGTA 
AGAACTTCCA 
ACTATTTCTT 
AAACACTGAA 
TAGTTCACTT 
ACTTAGAGAT 
TACATAATAT 
AAGTTTGAAA 
TGCTTCCTAA 
TATATATATT 



21 
I 

TCTTCTAATA 
AAGCCTGGAA 
TGAGATAAAC 
AAT CCAAGAA 
CCTGGAGATG 
GCCAGGGGGG 
TGACATGAAC 
TGTTACCCCC 
TGCCCGTGGA 
TGCTTTTGGA 
GACTACACAT 
CTTAGGTCTT 
TGACATCAAC 
AGACCCAAAA 
CCCCAATTTG 
CAGGTTCTTC 
CTTATGGCCA 
AGTTTTTCTT 
TTATCCCAAG 
TGTTTTTAAC 
TGATGAAAGG 
AGGAATCGGG 
CCAAGGATCT 
AAGCAATAGC 
CAGCTTAATA 
ATGTATCATA 
TTTTCAATTT 
ATAGTTACCT 
CATCCTTGGA 
TTGGCTCAAA 



31 

1 

CTGCTCCTGC 
AAAAATAATG 
AAACTTCCAG 
ATGCAGCACT 
ATGCACGCAC 
CCCGTATGGA 
CGTGAGGATG 
TTGAAATTCA 
GCT CATGGAG 
CCTGGATCTG 
TCAGGAGGCA 
GGCCATTCTA 
ACATTTCGCC 
GAGAACCAAC 
AGTTTTGATG 
TGGCTGAAGG 
ACCTTGCCAT 
TTTAAAGATG 
AGCATACATT 
CCACGTTTTT 
AGACAGATGA 
CCTAAAATTG 
AACCAATTTG 
TGGTTTGGTT 
AGTATTTATT 
AAAATAAAAT 
TGAAAACTCT 
TCAAAGCAAG 
CTGAGAAATT 
TAAAATTG 



41 
I 

AGGCCACTGC 
TGCTATTTGG 
TGACAAAAAT 
TCTTGGGTCT 
CTCGATGTGG 
GGAAACATTA 
TTGACTACGC 
GCAAGATTAA 
ACTTCCATGC 
GCATTGGAGG 
CAAACTTGTT 
GTGATCCAAA 
TCTCTGCTGA 
GCTTGCCAAA 
CTGTCACTAC 
TTTCTGAGAG 
CTGGCATTGA 
ACAAATACTG 
CTTTTGGTTT 
ATAGGACCTA 
TGGACCCTGG 
ATGCAGTCTT 
AATATGACTT 
GTTGAAAATG 
GCATATTTGC 
CTGTAAACCA 
AATTGTCCAT 
AT AAT T CT AT 
ATACTTACTT 



51 



TTCTGGAGCT 60 

TGAAAGATAC 12 0 

GAAATATAGT 180 

GAAAGTGACC 240 

AGT CCCCGAT 300 

TATCACCTAC 360 

AATCCGGAAA 420 

CACAGGCATG 480 

TTTTGATGGC 540 

GGATGCACAT 600 

CCTCACTGCT 660 

GGCCGTAATG 720 

TGACATACGT 780 

TCCTGACAAT 840 

CGTGGGAAAT 900 

ACCAAAGACC 960 

AGCTGCTTAT 1020 

GTTAATTAGC 10 80 

TCCTAACTTT 1140 

CTTCTTTGTA 1200 

TTATCCCAAA 1260 

CTACTCTAAA 1320 

CCTACTCCAA 1380 

GTGTAATTAA 1440 

TATGTCCTCA 1500 

TAGGTAATGA 1560 

TCTTGCTTGA 1620 

TTGAAGCATG 1680 

CTGGCATAAC 1740 



45 



Seq ID NO: 2 8 Protein sequence: 
Protein Accession #: Eos sequence 



50 



55 



60 



65 



70 



75 



80 



85 



MKFLLILLLQ 
KEKIQEMQHF 
YTPDMNREDV 
LAHAFGPGSG 
KYVDINTFRL 
FKDRFFWIiKV 
EPNYPKSIHS 
NFQGIGPKID 



11 
I 

ATASGALPLN 
LGLKVTGQLD 
DYAIRKAFQV 
I GGD AHFDED 
SADDIRGIQS 
SERPKTSVNL 
FGFPNFVKKI 
AVFYSKNKYY 



21 

1 

SSTSLEKNNV 
TSTLEMMHAP 
WSNVTPLKFS 
EFWTTHSGGT 
LYGDPKENQR 
ISSLWPTLPS 
DAAVFNPRFY 
YFFQGSNQFE 



31 
I 

LFGERYLEKF 
RCGVPDVHHF 
KINTGMAD I L 
NLFLTAVHEI 
LPNPDNSEPA 
GIEAAYEIEA 
RTYFFVDNQY 
YDFLLQRITK 



41 



51 



YGLEINKLPV 


TKMKYSGNLM 


60 


REMPGGPVWR 


KHYITYRINN 


120 


WFARGAHGD 


FHAFDGKGGI 


180 


GHSLGLGHSS 


DPKAVMFPTY 


240 


LCDPNLSFDA 


VTTVGNK IFF 


300 


RNQVFLFKDD 


KYWLISNLRP 


360 


WRYDERRQMM 


DPGYPKLITK 


420 


TLKSNSWFGC 







Seq ID NO: 29 DNA sequence 

Nucleic Acid Accession #: NM_006115.1 

Coding sequence: 236.. 1765 



11 



GCTTCAGGGT 
CGGGACACCC 
ACTCTCTGAG 
GAGACCTAGA 
ACGAAGGCGT 
CCCACGGAGA 
TGCCGCCCTG 
CGGGAGACAC 
TCTGGGAGTG 
TGGACTTGAT 
GGATT TACGG 
TCTGTACTCA 
TGGTTTGAGC 
CCTCAAGGAA 
GAAAAATGTA 
TAT C AAGATG 
TACCTGGAAG 
GCGTAGACTC 
GCAGTATATC 
TGTGG AC T CT 
CCCCTTGGAA 
GTCCCAGAGT 
CGATGTAAGT 
CCTGGTCTTT 
GAGCCACTGC 



ACAGCTCCCC 
CACCCGCTTC 
GAAAAACCAT 
AATCCAAGCG 
TTGTGGGGTT 
CTTGTGGAGC 
GAGTTGCTGC 
AGCCAGACCC 
CTGATGAAGG 
GTGCTCCTTG 
AAGAACTCTC 
TTTCCAGAGC 
ACAGAGGCAG 
GGTGCCTGTG 
CTACGCCTGT 
ATCCTGAAAA 
CTACCCACCT 
CTCCTCTCCC 
GCCCAGTTCA 
TTATTTTTCC 
ACCCTCTCAA 
CCCAGCGTCA 
CCCGAGCCCC 
GATGAGTGTG 
TCCCAGCTTA 



21 
I 

CGCAGCCAGA 
CCAGGCGTGA 
TTTGATTATT 
TTGGAGGTCC 
CC ATT CAG AG 
TGGCAGGGCA 
CCAGGGAGCT 
TGAAGGCAAT 
GACAACATCT 
CCCAGGAGGT 
AT CAGGACTT 
CAGAAGCAGC 
AGCAGCCCTT 
ATGAATTGTT 
GCTGTAAGAA 
TGGTGCAGCT 
TGGCGAAATT 
ACATCCATGC 
CCTCTCAGTT 
TTAGAGGCCG 
TAACTAACTG 
GTCAGCTAAG 
TCCAAGCTCT 
GGAT CACGGA 
CAACCTTAAG 



31 
I 

AGCCGGGCCT 
CCTGTCAACA 
ACTCTCAGAC 
TGAGGCCAGC 
CCGATACATC 
GAGCCTGCTG 
CTTCCCGCCA 
GGTGCAGGCC 
TCACCTGGAG 
TCGCCCCAGG 
CTGGACTGTA 
TCAGCCCATG 
CATTCCAGTA 
CTCCTACCTC 
GCTGAAGATT 
GGACTCTATT 
TTCTCCTTAC 
ATCTTCCTAC 
CCTCAGTCTG 
CCTGGATCAG 
CCGGCTTTCG 
TGTCCTGAGT 
GCTGGAGAGA 
TGAT CAGCTC 
CTTCTACGGG 



41 
I 

GCAGCCCCTC 
GCAACTTCGC 
GTGCGTGGCA 
CTAAGTCGCT 
AGCATGAGTG 
AAGGATGAGG 
CTCTTCATGG 
TGGCCCTTCA 
ACCTTCAAAG 
AGGTGGAAAC 
TGGTCTGGAA 
ACAAAGAAGC 
GAGGTGCTCG 
AT TGAGAAAG 
TTTGCAATGC 
GAAGATTTGG 
CTGGGCCAGA 
ATTTCCCCGG 
CAGTGCCTGC 
TTGCTCAGGC 
GAAGGGGATG 
CTAAGTGGGG 
GCCTCTGCCA 
CTTGCCCTCC 
AATTCCATCT 



51 



AGCACCGCTC 60 

GGTGTGGTGA 120 

ACAAGTGACT 180 

TCAAAATGGA 240 

TGTGGACAAG 300 

CCCTGGCCAT 360 

CAGCCTTTGA 420 

CCTGCCTCCC 480 

CTGTGCTTGA 540 

TTCAAGTGCT 600 

ACAGGGCCAG 660 

GAAAAGTAGA 720 

TAGACCTGTT 780 

TGAAGCGAAA 840 

CCATGCAGGA 900 

AAGTGACTTG 960 

TGATTAATCT 1020 

AGAAGGAAGA 1080 

AGGCTCTCTA 1140 

ACGTGATGAA 1200 

TGATGCATCT 1260 

TCATGCTGAC 132 0 

CCCTCCAGGA 1380 

TGCCTTCCCT 1440 

CCATATCTGC 1500 



198 



10 



WO 02/086443 

CTTGCAGAGT CTCCTGCAGC 
TGTCCCCCTG GAGAGTTATG 
TCTGCATGCC AGGCTCAGGG 
TAGTGCCAAC CCCTGTCCTC 
GTGCCCCTGT TTCATGCCTA 
TTGGACACTA AAGCCAGGAT 
ACAAATGTTC AGTGTGAGTG 
GTT CAGTGAG GAAAAAAAGG 
GTGATCTTTG GGGAGATACA 
GATTCTGGCT TGGGAAGTAC 
TGTTGAAAAT AAAGAGAAGC 



PCT/US02/12476 



ACCT CATCGG 
AGGACATCCA 
AGTTGCTGTG 
ACTGTGGGGA 
ACTAGCTGGG 
GTGCATGCAT 
AGGAAAACAT 
GGAAGTTGGG 
TCTTATAGAG 
ATGTAGGAGT 
AATGTGAAGC 



GCTGAGCAAT 
TGGTACCCTC 
TGAGTTGGGG 
CAGAACCTTC 
TGCACATATC 
CTTGAAGCAA 
GTT CAGTGAG 
GATAGGCAGA 
TTAGAAATAG 
TAATCCCTGT 
AAAAAAAAAA 



CTGACCCACG 
CACCTGGAGA 
CGGCCCAGCA 
TATGACCCGG 
AAATGCTTCA 
CAAAGCAGCC 
GAAAAAACAT 
TGTTGACTTG 
AATCTGAATT 
GTAGACTGTT 
AAAAAAAA 



TGCTGTATCC 1560 

GGCTTGCCTA 1620 

TGGTCTGGCT 1680 

AGCCCATCCT 1740 

TTCTGCATAC 1800 

ACAGTTTCAG 1860 

TCAGACAAAT 192 0 

AGGAGTTAAT 1980 

TCTAAAGGGA 2040 

GT AAAGAAAC 2100 



15 



Seq ID NO: 30 Protein sequence: 
Protein Accession #: NP_006106.1 
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GCTTCAGGGT 
CGGGACACCC 
ACTCTCTGAG 
GAGACCTAGA 
ACGAAGGCGT 
CCCACGGAGA 
TGCCGCCCTG 
CGGGAGACAC 
TCTGGGAGTG 
TGGACTTGAT 
GGATTTACGG 
TCTGTACTCA 
TGGTTTGAGC 
CCT CAAGGAA 
GAAAAATGTA 
TAT CAAGATG 
TACCTGGAAG 
GCGTAGACTC 
GCAGTATATC 
TGTGGACTCT 
CCCCTTGGAA 
GTCCCAGAGT 
CGATGTAAGT 
CCTGGTCTTT 
GAGCCACTGC 
CTTGCAGAGT 
TGTCCCCCTG 
TCTGCATGCC 
TAGTGCCAAC 
GTGCCCCTGT 
TTGGACACTA 
ACAAATGTTC 
GTT CAGTGAG 
GTGATCTTTG 
GATTCTGGCT 
TGTTGAAAAT 



11 
I 

ACAGCTCCCC 
CACCCGCTTC 
GAAAAACCAT 
AATCCAAGCG 
TTGTGGGGTT 
CTTGTGGAGC 
GAGTTGCTGC 
AGCCAGACCC 
CTGATGAAGG 
GTGCTCCTTG 
AAGAACTCTC 
TTTCCAGAGC 
ACAGAGGCAG 
GGTGCCTGTG 
CTACGCCTGT 
ATCCTGAAAA 
CTACCCACCT 
CTCCTCTCCC 
GCCCAGTTCA 
TTATTTTTCC 
ACCCTCTCAA 
CCCAGCGTCA 
CCCGAGCCCC 
GATGAGTGTG 
TCCCAGCTTA 
CTCCTGCAGC 
GAGAGTTATG 
AGGCTCAGGG 
CCCTGTCCTC 
TTCATGCCTA 
AAGCCAGGAT 
AGTGTGAGTG 
GAAAAAAAGG 
GGGAGATACA 
TGGGAAGTAC 
AAAGAGAAGC 



21 



31 



41 



51 



CGCAGCCAGA 
CCAGGCGTGA 
TTTGATTATT 
TTGGAGGTCC 
CCATT CAG AG 
TGGCAGGGCA 
CCAGGGAGCT 
TGAAGGCAAT 
GACAACATCT 
CCCAGGAGGT 
AT CAGGACTT 
CAGAAGCAGC 
AGCAGCCCTT 
ATGAATTGTT 
GCTGTAAGAA 
TGGTGCAGCT 
TGGCGAAATT 
ACATCCATGC 
CCTCTCAGTT 
TTAGAGGCCG 
TAACTAACTG 
GTCAGCTAAG 
TCCAAGCTCT 
GGAT CACGGA 
CAACCTTAAG 
ACCTCATCGG 
AGGACATCCA 
AGTTGCTGTG 
ACTGTGGGGA 
ACTAGCTGGG 
GTGCATGCAT 
AGGAAAACAT 
GGAAGTTGGG 
TCTTATAGAG 
ATGTAGGAGT 
AATGTGAAGC 



AGCCGGGCCT 
CCTGTCAACA 
ACTCTCAGAC 
TGAGGCCAGC 
CCGATACATC 
GAGCCTGCTG 
CTTCCCGCCA 
GGTGCAGGCC 
T C AC CTGGAG 
TCGCCCCAGG 
CTGGACTGTA 
TCAGCCCATG 
CATTCCAGTA 
CTCCTACCTC 
GCTGAAGATT 
GGACTCTATT 
TTCTCCTTAC 
ATCTTCCTAC 
CCTCAGTCTG 
CCTGGATCAG 
CCGGCTTTCG 
TGTCCTGAGT 
GCTGGAGAGA 
TGATCAGCTC 
CTTCTACGGG 
GCTGAGCAAT 
TGGTACCCTC 
TGAGTTGGGG 
CAGAACCTTC 
TGCACATATC 
CTTGAAGCAA 
GTTCAGTGAG 
GATAGGCAGA 
TTAGAAATAG 
TAATCCCTGT 
AAAAAAAAAA 



GCAGCGCCTC 
GCAACTTCGC 
GTGCGTGGCA 
CTAAGTCGCT 
AG CATGAGTG 
AAGGATGAGG 
CTCTTCATGG 
TGGCCCTTCA 
ACCTTCAAAG 
AGGTGGAAAC 
TGGT CTGGAA 
ACAAAGAAGC 
GAGGTGCTCG 
ATTGAGAAAG 
TTTGCAATGC 
GAAGATTTGG 
CTGGGCCAGA 
ATTTCCCCGG 
CAGTGCCTGC 
TTGCTCAGGC 
GAAGGGGATG 
CTAAGTGGGG 
GCCTCTGCCA 
CTTGCCCTCC 
AATTCCATCT 
CTGACCCACG 
CACCTGGAGA 
CGGCCCAGCA 
TATGACCCGG 
AAATGCTTCA 
CAAAGCAGCC 
GAAAAAACAT 
TGTTGACTTG 
AATCTGAATT 
GTAGACTGTT 
AAAAAAAA 



AGCACCGCTC 
GGTGTGGTGA 
ACAAGTGACT 
TCAAAATGGA 
TGTGGACAAG 
CCCTGGCCAT 
CAGCCTTTGA 
CCTGCCTCCC 
CTGTGCTTGA 
TTCAAGTGCT 
ACAGGGCCAG 
GAAAAGTAGA 
TAGACCTGTT 
TGAAGCGAAA 
CCATGCAGGA 
AAGTGACTTG 
TGATTAATCT 
AGAAGGAAGA 
AGGCTCTCTA 
ACGTGATGAA 
TGATGCATCT 
TCATGCTGAC 
CCCTCCAGGA 
TGCCTTCCCT 
CCATAT CTGC 
TGCTGTATCC 
GGCTTGCCTA 
TGGTCTGGCT 
AGCCCATCCT 
TTCTGCATAC 
ACAGTTTCAG 
TCAGACAAAT 
AGGAGTTAAT 
TCTAAAGGGA 
GTAAAGAAAC 



Seq ID NO: 31 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 64-2754 



11 



85 



GGCAGGTCTC 
CCGATGGCCG 
CTGACCCTCG 
CCTTCTAAAC 
TCTGCAGACC 
TACACAGCCA 
GACAAAAGGA 
TCGAAGACAA 
ATTCCTTGCT 
GAAT CTGATG 
AAAGAACCTT 
CCTGTGGATC 
GGATATTCAG 
CACCCTGTTT 
ACTACAGTGG 
CTGAAATACA 
AGCACAGGCG 
TCATTGATAA 
ACTTGTATCA 
TATGAAGCAT 
GATAAGGATT 
GAAAATGGAC 
GTAAAGCCAC 
GAAGCGCCAT 
GTTCATGTGA 
ATTAAAGAAA 



GCTCTCGGCA 
CCGCTGGGCC 
TGAT CTTCAG 
TAGAGGCAGA 
TCATCCGGTC 
GGGCTGTTGC 
AACAGACACA 
GACACACTAG 
CTATGCAAGA 
CAGCACAGAA 
TAAATTTGTT 
GTGAAGAATA 
CAGATCTGCC 
TCACAGAAGC 
GGGTGGTTTG 
GCATTTTGCA 
TAAT CACCAC 
TGAAAGTACA 
TAACAGTAAC 
TTGTAGAGGA 
TAATTAACAC 
ATTTCAAAAT 
TGAATTATGA 
TTGCTAGAGA 
GGGATCTGGA 
ACTTAGCAGT 



21 

I 

CCCTCCCGGC 
CCGGCGCTCC 
TCGTGATGGT 
CAAAATAATT 
AAGTGATCCT 
GCTGTCTGAT 
GAAAGAGGTT 
AGAAA CTGT T 
GAATTCCTTG 
CTATACTGTC 
TTATATAGAA 
TGATGTTTTT 
CCTCCCACTA 
AATTTATAAT 
TGCCACAGAC 
GCAGACACCA 
AGTCTCTCAT 
AGACATGGAT 
AGATTCAAAT 
AAATGCATTC 
TGCCAATTGG 
CAG CAC AG AC 
AGAAAACCGT 
TATTCCCAGA 
TGAGGGGCCT 
GGGGTCAAAG 



31 

I 

GCCCGCGTTC 
GTGCGCGGAG 
GAAGCCTGCA 
GGCAGAGTTA 
GATTTCAGAG 
AAGAAAAGAT 
ACTGTGCTGC 
CTCAGGCGTG 
GGCCCTTTCC 
TTCTACTCAA 
AGAGACACTG 
GATTTGATTG 
CCCAT CAGGG 
TTTGAAGTTT 
AGAGATGAAC 
AGGTCACCTG 
TATTTGGACA 
GGCCAGTTTT 
GATAATGCAC 
AATGTGGAAA 
AGAGTCAATT 
AAAGAAACTA 
CAAGTGAACC 
GTGACAGCCT 
GAATGCACTC 
AT CAACGGCT 



41 

] 

TCCTGGCCCT 
CCGTCTGCCT 
AAAAGGTGAT 
ATTTGGAAGA 
TTCTAAATGA 
CATTTACCAT 
TAGAACATCA 
CCAAGAGGAG 
CATTGTTTCT 
TAAGTGGACG 
GAAAT CTATT 
CTTATGCGTC 
TAGAGGATGA 
TGGAAAGTAG 
CGGACACAAT 
GGCTCTTTTC 
GAGAGGTTGT 
TTGGATTGAT 
CCACTTTCAG 
TCTTACGAAT 
TTACCATTTT 
ATGAAGGTGT 
TGGAAATTGG 
TGAACAGAGC 
CTGCAGCCCA 
ATAAGGCATA 



51 

I 

GCCCGGCATC 
GCATCTGCTG 
ACTTAATGTA 
GTGCTTCAGG 
TGGGTCAGTG 
ATGGCTTTCT 
GAAGAAGGTA 
ATGGGCACCT 
TCAACAAGTT 
TGGAGTTGAT 
TTGCACTCGG 
AACTGCAGAT 
AAATGACAAC 
TAGACCTGGT 
GCATACGCGC 
TGTGCATCCC 
AGACAAGTAC 
AGGCACAT CA 
ACAAAATGCT 
ACCTATAGAA 
AAAGGGAAAT 
TCTTTCTGTT 
AGTAAACAAT 
CTTGGTTACA 
ATATGTGCGG 
TGACCCCGAA 



60 
120 
180 
240 
300 
360 
420' 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 



60 
12 0 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
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WO 02/086443 

AATAGAAATG GCAATGGTTT 
ATTGATGAAA TTTCAGGGTC 
CCCAAAAATG AGTTGTATAA 
ACTGGAACAC TTGCTGTGAA 
GAATATGTAG TCATTTGCAA 
GATGAACCTG TCCATGGAGC 
AGTAGACTGT GGAGCCTCAC 
AATGCTGGAT TTCAAGAATA 
GCAACAAAAT TATTGAGAGT 
ACTT CAAGGA GTACAGGAGT 
ATAGCACTGC TCTTTTCTGT 
GGGAAACGTT TTCCTGAAGA 
CCTGGAGACG ATAGAGTGTG 
AGCCAAGGTT TTTGTGGTAC 
GAAATGATGA AAGGAGGAAA 
ACCCTGGACT CCTGCAGGGG 
GAGTGGCACA GTTTTACTCA 
GAAGACCGCA TGCCATCCCA 
CCAGCTGGTT CTGTGGGCTG 
AATAATTTGG AACCCAAATT 
AGTGCTACAA TTAGGTCTTT 
TTCAATTTCA ACATGTATGT 
CCAATTTATA TTTTTAAAGC 
AACAGACAAC TGGTAAATCT 
TCTTTTTTTT TTTTACGGAT 
ATAGGTAAGT TATGCTAATA 
ATAAACAAGA AATATTGAGT 
ACTGAATTAA ATTAAAAATG 
ACCAAATTCA TTTGACTTTG 
TCTATAGGAA TATAGTTGGA 
ATTTAAAATG AAATGAGAAC 
TAGTTTGTCC TACAATAGAA 
ATTATAACTG AGTCTATGAG 
GTAAATAAAT TAAACTTTTC 
TAGCTTTGCT TTGCAGTCTG 
GAAT ACT CGC TGCAGCTGGG 
TTTTTTTCGG GGAGCTAATA 
CTCTATTGCT GTTTCTATTC 
TAACCATGTC CTCCTAGAGT 
GCACCCTGGG GAG AT TG ATT 
GTCTGGGAGC TACAAAATTT 
CTGAATCAAG GAAAGCCAGG 
ACCTCCAGCA GAGATTCCCT 
AATTTTTAAT CAGTTTGCTT 
TTGAATGTAT AAAAGAAAAA 
AAGCAGCCCA AGTAGGTTAT 
GGGCAAGGAG AGGCCACAAG 
CTTTTTCCTA GGCTTGGCAC 
GTCCGGTGAG GGAT CAGCC A 
AAGGAGACAG AGCTGACTGC 
GTTGTGCAGA ACAAACAAGG 
CTGGGCACTA AGAAGGTCTA 
TTTTCTGTTT TCTAATTTGA 
CCCCCCCCCC TTTTTTTTTG 
GCTCCGATCT CTGCTCACTG 
GCCTCCTGAG TAGCTGGGAC 
TTTAATAGAG ACGGGGTTTC 
ATCCGCCTGC CTCGGCCTCC 
CTTGTTTTGC GTTTAAAGTC 
TGAT CATACG AATTGG AT CA 
GGGAGAAAGA ACTCAGGGCA 
TTGCTGAAAT TTCCTGCTGT 
ACTGTGTTTT GCTCACTCCC 
CTAGTGCCGA TAAACTTTCT 
TAACCATCTC TTTGTTCTTT 
TTTGTAATTC TTTTCTCTCA 
CATATGTAGT ATTATTATTT 
CAAGAAAATA TATTTTTAAA 
TGTAAATATA CAGAATGTTT 
GGGGTTTGTT TTGCAATGTT 
TGCTTTTAAA GAAACTTGGC 
TACAGATGTG GGGAGATGTA 
TAGAGATTAA ATAATTCTAA 
AATAGAAATA CTCAATTATG 
ATTAT CAAAT TGTCGACATC 
GAAGCACAGC TTTACAGATG 
ATTAAAAGTA TTAGAAGGTG 
AGGGGTTTTA CTTTGAGGAC 
GGCAATATTG CAGTCTTGAT 
CAAGATGATC C AAC CAT AAA 
AGTGTGCTCC CCTACAAACG 
AGCCTTACAT TTTAATATAG 
CATTATTTTT GTGTATGTCT 
ACCGGATACA TTTCACGTGT 
TGAGAAGCAT GGACACTAGA 
TTCTGTGTGA CCTTTGAAAG 
GAACAATGCC AGCCTCATGG 



PCT/US02/12476 



AAGGTACAAA 
AATCATAACT 
TATTACAGTC 
CATTGAAGAT 
ACCAAAAATG 
TCCATTTTAT 
CAAAGTTAAT 
TACCATTCCT 
TAATCTGTGT 
AATACTTGGA 
ATTGCTAACT 
TTTAGCACAG 
CTCTGCCAAT 
TATGGGATCA 
CCAGACCTTG 
AGGACACACG 
ACCCCGTCTC 
AGATTATGTC 
CTGCAGTGAA 
TATTACATTA 
GTCAGACATT 
ATATGATGAT 
CAGTTGTTGC 
CAAACTCCAG 
ATTTTAGTAA 
TCACATTATT 
AT CACTATGT 
TTGCAGCTCA 
GAGGCAAAAT 
AATAAATGTG 
AAAGAGGAAA 
AAAAGAGAGA 
GAAAT AGTT C 
TGGTTTCTGT 
TTTCAAGATT 
GTTCCCTGCT 
ACAAAAACAT 
TCT CTTATAG 
TTAGAGGCTA 
GTCCTTAAAC 
CATTTTTCTC 
CCTTGTGGGC 
TAAGTGACTC 
TCTCCAGAGA 
GATCAAGTTG 
TTGTACAGTC 
GAAT AT GGGT 
TGCCTTTTCC 
ACCTCTTCTC 
ATGATGAGTC 
CATT CATGGG 
TGAATTAAAT 
CCCTAAAATC 
AGACGGAGTC 
AAAGCTCCGC 
TACAGGCGCC 
ACTGTGTTAG 
CAAAGTGCTG 
GTCTTCTTTT 
AT CT TGAAAT 
CAAAATATTG 
AACCAGAAGC 
TCACTCACCG 
CAAAGAGCAA 
GAACATGCTG 
AATGAAAAT T 
CCTTATATGT 
GCTTTCATTT 
TTTCTTACTT 
TTAAACAGAG 
TGCTTAAAAT 
ATAAAACAAT 
GATGATCACT 
TCTTTGTTGT 
ATTAATATAT 
AGTATCTATG 
GTTATAATTG 
CAGTGTAGTC 
TCTGCCACTT 
GGTGCTCTGT 
TTAAGACTGA 
GTTGAACCAA 
TCAAGAATGT 
CCTTCAGTAT 
GCCAGAATGC 
GCTACTTATT 
GGTTGTTGAA 



AAATTGCATG 

TCCAAAATCC 

CTGGCAATAG 

GTAAATGATA 

GGGTATACCG 

TTCAGTTTGC 

GATACAGCTG 

ATTACTGTAA 

GAATGTACTC 

AAATGGGCAA 

TTAGTATGTG 

CAAAACTTAA 

GGATTTATGA 

GGAATGAAAA 

GAATCCTGCC 

GAGGTGGACA 

GGTGAAAAAT 

CTCACTTATA 

AAG CAGGAAG 

GCAGAAGCAT 

CTGGAGGTTT 

TTTTTTCTCA 

TTATCTTTTC 

CACTGGAATT 

TAAATATGCT 

ATGTATTCAC 

GAAGAAAGTT 

TAAAGAATTG 

GTGTTGAAGT 

TGTGTGTATA 

AT GGT AAAAA 

GCTTCCTAGG 

CTGTCCAATT 

GGGAAGGAAA 

TCTGCATCCA 

TTTTGGTAGC 

TTTAAAACTT 

TGACCAACAT 

GAGGGAGCTG 

CTAAGCCCCA 

CTCACTGCCC 

CCCCTTCTTT 

CAGGTTTTCC 

AATTTTAAAA 

TCATTTTAGA 

AGAGGGCAAC 

GGGAGTAAAA 

TTTCTCAGGC 

TATGGCTCAC 

TGAAGGCATT 

AATTGTTGTA 

GCCTATCTAA 

TATGTGTTTT 

TCGCTCTGAC 

CTCCCGGGTT 

CACCACCACG 

CCAGGATGGT 

GGATTACAGG 

AATGTAATCA 

ACTCAACCAA 

GTCTGAGAAT 

CAGTTTTATC 

ATCAAAACCT 

CCAGTATCAC 

AAAACCACCT 

TAATTTTAGG 

GTAAGGTGAA 

TTCCCCCAGT 

TTATAAGGAA 

TTTTAGTATT 

AAGCAAAAAT 

ATTAACTTGG 

TTGCAAAATT 

ATTAATGGGG 

ATTGTAATGT 

ATACATATGT 

CAGAGTATTC 

AAGGGAAAAC 

ACAGGATAGA 

GCTTCACAGT 

TCATTTCAAA 

AATTTCAATr 

TCATTGGATT 

TGATTTGGTT 

TTGGATATGA 

TCCTCTCTTA 

TGATTAAATT 



ATCCTAAAGG 
TGGATAGGGA 
ACAAAGATGA 
ATCCACCAGA 
ACATTTTAGC 
CCAATACTTC 
CCCGTCTTTC 
AAGACAGGGC 
ATCCAACTCA 
TCCTTGCAAT 
GAGTTTTTGG 
TTAT AT C AAA 
CCCAAACTAC 
ATGGAGGGCA 
GGGGGGCTGG 
ACTGCAGATA 
TGCATCGATG 
ACTATGAGGG 
AAGATGGCCT 
GCACAAAGAG 
CCAAAAATAA 
ATTTTGAATT 
CAAAAAGTGA 
AAGGTCTCTA 
GGATAAATAT 
TTTAAGTGAT 
TTGGAAAAGA 
GGACTCACCC 
GCCCTATGAA 
TTATTATTAA 
CTTGAAATGA 
CCTGGGCTCT 
TGTGTAATTT 
TAGGGAATCC 
CAAGTTAGTA 
AAGGGT CCAG 
ACCTTTACTG 
CTTTTTAATT 
AGGGGAGGAT 
CAAACTTGAC 
TTCTTCTGAG 
CGGCTTTCTG 
ACCATCCTTC 
TAATAGAAGA 
ACAGAGGGAA 
AGGAAGATGC 
GCAACATCGT 
CAATGGCAAC 
CTTATTTGGA 
TGCAGGATGA 
TTCCTTCTGC 
AATTCTGATT 
AGACTTAGAC 
GCACAGGCTG 
CATGCCATTC 
CCCGGCTAAT 
CTCGATCTCC 
CATGACCCAC 
TTTTGAACAT 
AAGACAGTCG 
GGAATTCTCT 
TAACGGCTAC 
GCTACCTCCC 
TTCCCTGTTT 
GGTCTGCATG 
GATTCATTTC 
ATTTATGGTA 
GAATGATTTA 
GCAGCTGTCT 
GCTATTAAAA 
TGGATGCATA 
TTTCTTGTTT 
ATGCTTATGG 
AATATTTTGG 
TGGGAAGAGA 
ATAATAAATT 
CATGAATAGT 
ATGAGTTAAA 
TAATGCCTGA 
GAATCTTTTC 
AATCTATTAG 
CCAGTAACTT 
TTTGTTTGTA 
GAATATTGGG 
ATCCTGGATC 
GCTTTCTCAT 
AGTTAATATA 



TTGGATCACC 1620 

GGTTGAAACT 1680 

TAGATCATGT 1740 

AATACTTCAA 1800 

TGTTGATCCT 1860 

TCCAGAAATC 192 0 

ATATCAGAAA 1980 

CGGCCAAGCT 2 040 

GTGTCGTGCG 2100 

ATTACTGGGT 2160 

TGCAACTAAA 2220 

CAC AG AAG CA 2280 

CAACAACT CT 2340 

GGAAACCATT 2400 

GCATCAT CAT 2460 

CACTTACTCG 2520 

TAATCAGAAT 2580 

AAGAGGATCT 2640 

TGACTTTTTA 2700 

ATAATGTCAC 2760 

TATTGTAAAG 282 0 

ATGCTACTCA 2880 

AAAATGTTAA 2940 

AAGCATCTGC 3 00 0 

TAGTCCAACA 3 0 60 

AGTTTAAAAA 3120 

AACAATGAAG 3180 

CTACTGCACT 3240 

GTAGCAATTT 3300 

TCAATGCAAT 3360 

GGCTGGGGTA 3420 

TAAATGCTGC 3480 

GTTTAAAATT 3540 

AATGGAACAG 3600 

GCAAACTGGG 3 660 

AGATGAGGTG 372 0 

AAGTTAAATC 3780 

TAGATCCAAA 3 840 

CTTACTGAAA 3900 

ACCTGATCAG 3 960 

TGGCATTGGC 4020 

CTAAAGCAAC 4080 

AGCGTGAATT 4140 

AATAGAAATT 42 00 

CTTTGGGAGA 42 60 

AGGCCTTCAA 432 0 

CTGCTTCATA 4380 

TGCCATTTGA 4440 

GTGAGAAATC 4500 

GCCTGAACTG 4560 

AGCCCTCCTT 4620 

TATTCCTACA 4680 

TTTTTATTGC 4740 

GAGTGCAGTG 4800 

TCCTGCCTCA 4860 

TTTTTGTATT 4920 

TGACCTCGTG 4980 

CGCTCCCGGC 5040 

GTGTGAAAGT 5100 

AGAAGCCAGG 5160 

GTAAGCCTAG 5220 

TGAAACACCC 52 80 

CAAGACTTTA 5340 

ATAAAACCTC 540 0 

TATGCCCGAA 5460 

TATATTTTCA 5520 

TTTGAGTGTG 5580 

GAATTTTTTA 5640 

AAAATGCAGT 5700 

GAAGTTACTT 5760 

AAGTAATATT 582 0 

TTGCTGTATT 5880 

CTGGCATGGA 5940 

ACAATGTTTC 600 0 

TCACTATTTT 6060 

TTGAT CGGGT 6120 

ACACTGACAC 6180 

AAGAAAAGCA 6240 

ACTTTAATGA 6300 

CCCATGCAGG 6360 

CTATAT CAAA 6420 

CTATTGTAAC 6480 

AT AGTAAAAT 6540 

TCATAATGGT 6600 

TGTCACTTAC 6660 

TAAAATCAAT 6720 

CCTAAAGTAC 6780 



200 



WO 02/086443 

ATAGAACACT GCCTGCACAT AGTAAAAGAA TTATAAGTGT GAGGTAGTTG GTAAAATTAT 
GTAGTTGGAT ATACTACCGA ACAATATCTA ATCTCTTTTT AGGGAAATAA AGTTTGTGCA 
TATATATAAT CCCGAAACAT G 



6840 
6900 
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Seq ID NO: 32 Protein sequence: 
Protein Accession #: NP 001932.1 
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MAAAGPRRSV 
ADLIRSSDPD 
KTRHTRETVL 
EPLNLFYIER 
PVFTEAIYNF 
TGVITTVSHY 
EAFVEENAFN 
KPLNYEENRQ 
KENLAVGSKI 
KNELYNITVL 
EPVHGAPFYF 
TKLLRVNLCE 
KRFPEDLAQQ 
MMKGGNQTLE 
DRMPSQDYVL 



11 
1 

RGAVCLHLLL 
FRVLNDGSVY 
RRAKRRWAPI 
DTGNLFCTRP 
EVLESSRPGT 
LDREWDKYS 
VEILRIPIED 
VNLEIGVNNE 
NGYKAYDPEN 
AIDKDDRSCT 
SLPNTSPEIS 
CTHPTQCRAT 
NLIISNTEAP 
SCRGAGHHHT 
TYNYEGRGSP 



21 
I 

TLVIFSRDGE 
T ARAVAL SDK 
PCSMQENSLG 
VDREEYDVFD 
TVGWCATDR 
LIMKVQDMDG 
KDLINTANWR 
APFARDIPRV 
RNGNGDRYKK 
GTLAVNIEDV 
RLWSLTKVND 
SRSTGVILGK 
GDDRVCSANG 
LDSCRGGHTE 
AGSVGCCSEK 



31 



ACKKVILNVP 
KRSFTIWLSD 
PFPLFLQQVE 
LIAYASTADG 
DEPDTMHTRL 
QFFGLIGTST 
VNFTILKGNE 
TALNRALVTV 
LHDPKGWITI 
NDNPPEILQE 
TAARLSYQKN 
WAILAILLGI 
FMTQTTNNSS 
VDNCRYTYSE 
QEEDGLDFLN 



41 
I 

SKLEADKIIG 
KRKQTQKEVT 
SDAAQNYTVF 
YSADLPLPLP 
KYSILQQTPR 
CIITVTDSND 
NGHFKISTDK 
HVRDLDEGPE 
DEISGSIITS 
YWICKPKMG 
AGFQEYTIPI 
ALLFSVLLTIi 
QGFCGTMGSG 
WHSFTQPRLG 
NLEPKFITLA 



51 

1 

RVNLEECFRS 
VLIjEHQKKVS 
YS I SGRGVDK 
IRVEDENDNH 
SPGLFSVHPS 
NAPTFRQNAY 
ETNEGVLSW 
CTPAAQYVRI 
KILDREVETP 
YTDILAVDPD 
TVKDRAGQAA 
VCGVFGATKG 
MKNGGQETIE 
EKLHRCNQNE 
EACTKR 



Seq ID NO: 33 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 64-25 83 



11 



85 



GGCAGGTCTC 
CCGATGGCCG 
CTGACCCTCG 
CCTTCTAAAC 
TCTGCAGACC 
TACACAGCCA 
GACAAAAGGA 
TCGAAGACAA 
ATTCCTTGCT 
GAAT CTGATG 
AAAGAACCTT 
CCTGTGGATC 
GGATATTCAG 
CACCCTGTTT 
ACTACAGTGG 
CTGAAATACA 
AGCACAGGCG 
TCATTGATAA 
ACTTGTATCA 
TATGAAGCAT 
GATAAGGATT 
GAAAATGGAC 
GTAAAGCCAC 
GAAGCGCCAT 
GTTCATGTGA 
ATTAAAGAAA 
AATAGAAATG 
ATTGATGAAA 
CCCAAAAATG 
ACTGGAACAC 
GAATATGTAG 
GATGAACCTG 
AGTAGACTGT 
AATGCTGGAT 
GCAACAAAAT 
ACTTCAAGGA 
ATAGCACTGC 
GGGAAACGTT 
CCTGGAGACG 
AGCCAAGGTT 
GAAATGATGA 
ACCCTGGACT 
GAGTGGCACA 
TAAAAATTAA 
CCAAGATTAT 
CTGCTGCAGT 
ATTTATTACA 
TTTGT CAGAC 
TGTATATGAT 
AGCCAGTTGT 
TCTCAAACTC 
GATATTTTAG 
ATATCACATT 
AGTATCACTA 
ATGTTGCAGC 



GCTCTCGGCA 
CCGCTGGGCC 
TGATCTTCAG 
TAGAGGCAGA 
TCATCCGGTC 
GGGCTGTTGC 
AACAGACACA 
GACACACTAG 
CTATG CAAGA 
CAGCACAGAA 
TAAATTTGTT 
GTGAAGAATA 
CAGATCTGCC 
TCACAGAAGC 
GGGTGGTTTG 
GCATTTTGCA 
TAAT CACCAC 
TGAAAGTACA 
TAACAGTAAC 
TTGTAGAGGA 
TAATTAACAC 
ATTTCAAAAT 
TGAATTATGA 
TTGCTAGAGA 
GGGATCTGGA 
ACTTAGCAGT 
GCAATGGTTT 
TTTCAGGGTC 
AGTTGTATAA 
TTGCTGTGAA 
TCATTTGCAA 
TCCATGGAGC 
GGAGCCTCAC 
TTCAAGAATA 
TATTGAGAGT 
GTACAGGAGT 
TCTTTTCTGT 
TTCCTGAAGA 
ATAGAGTGTG 
TTTGTGGTAC 
AAGGAGGAAA 
CCTGCAGGGG 
GTTTTACTCA 
ACATAAAAGA 
GTCCTCACTT 
GAAAAGCAGG 
TTAGCAGAAG 
ATTCTGGAGG 
GATTTTTTTC 
TGCTTATCTT 
CAGCACTGGA 
TAATAAATAT 
ATTATGTATT 
TGTGAAGAAA 
TCATAAAGAA 



21 
I 

CCCTCCCGGC 
CCGGCGCTCC 
TCGTGATGGT 
CAAAATAATT 
AAGTGAT CCT 
GCTGTCTGAT 
GAAAGAGGTT 
AGAAACTGTT 
GAATTCCTTG 
CTATACTGTC 
TTATATAGAA 
TGATGTTTTT 
CCTCCCACTA 
AATTTATAAT 
TG C C ACAG AC 
GCAGACACCA 
AGTCTCTCAT 
AGACATGGAT 
AGATTCAAAT 
AAATGCATTC 
TGCCAATTGG 
CAGCACAGAC 
AGAAAACCGT 
TATTCCCAGA 
TGAGGGGCCT 
GGGGTCAAAG 
AAGGTACAAA 
AATCATAACT 
TATTACAGTC 
CATTGAAGAT 
ACCAAAAATG 
TCCATTTTAT 
CAAAGT TAAT 
TACCATTCCT 
TAATCTGTGT 
AATACTTGGA 
ATTGCTAACT 
TTTAGCACAG 
CTCTGCCAAT 
TATGGGATCA 
CCAGACCTTG 
AGGACACACG 
ACCCCGTCTC 
AATTGCATCG 
ATAACTATGA 
AAGAAGATGG 
CATGCACAAA 
TTTCCAAAAA 
TCAATTTTGA 
TTCCAAAAAG 
ATTAAGGTCT 
GCTGGATAAA 
CACTT TAAGT 
GTTTTGGAAA 
TTGGGACTCA 



31 

I 

GCCCGCGTTC 
GTGCGCGGAG 
GAAGCCTGCA 
GGCAGAGTTA 
GATTTCAGAG 
AAGAAAAGAT 
ACTGTGCTGC 
CTCAGGCGTG 
GGCCCTTTCC 
TTCTACTCAA 
AGAGACACTG 
GATTTGATTG 
CCCATCAGGG 
TTTGAAGTTT 
AGAGATGAAC 
AGGTCACCTG 
TATTTGGACA 
GGCCAGTTTT 
GATAATGCAC 
AATGTGGAAA 
AGAGTCAATT 
AAAGAAACTA 
CAAGTGAACC 
GTGACAGCCT 
GAATGCACTC 
AT CAACGGCT 
AAATTGCATG 
TCCAAAATCC 
CTGGCAATAG 
GTAAATGATA 
GGGTATACCG 
TTCAGTTTGC 
GATACAGCTG 
AT T ACTGT AA 
GAATGTACTC 
AAATGGGCAA 
TTAGTATGTG 
CAAAACTTAA 
GGATTTATGA 
GGAATGAAAA 
GAATCCTGCC 
GAGGTGGACA 
GGTGAAGAAT 
ATGTAATCAG 
GGGAAGAGGA 
CCTTGACTTT 
GAGATAATGT 
TAATATTGTA 
ATTATGCTAC 
TGAAAAATGT 
CTAAAGCATC 
TATTAGTCCA 
GATAGTTTAA 
AGAAACAATG 
CCCCTACTGC 



41 



TCCTGGCCCT 
CCGTCTGCCT 
AAAAGGTGAT 
ATTTGGAAGA 
TTCTAAATGA 
CATTTACCAT 
TAGAACATCA 
CCAAGAGGAG 
CATTGTTTCT 
TAAGTGGACG 
GAAATCTATT 
CTTATGCGTC 
TAGAGGATGA 
TGGAAAGTAG 
CGGACACAAT 
GGCTCTTTTC 
GAGAGGTTGT 
TTGGATTGAT 
CCACTTTCAG 
TCTTACGAAT 
TTACCATTTT 
ATGAAGGTGT 
TGGAAATTGG 
TGAACAGAGC 
CTGCAGCCCA 
ATAAGGCATA 
ATCCTAAAGG 
TGGATAGGGA 
ACAAAGATGA 
ATCCACCAGA 
ACATTTTAGC 
CCAATACTTC 
CCCGTCTTTC 
AAGACAGGGC 
AT CCAACTCA 
TCCTTGCAAT 
GAGTTTTTGG 
TTATATCAAA 
CCCAAACTAC 
ATGGAGGGCA 
GGGGGGCTGG 
ACTGCAGATA 
CCATTAGAGG 
AATGAAGACC 
TCTCCAGCTG 
TTAAATAATT 
CACAGTGCTA 
AAGTT CAATT 
TCACCAATTT 
TAAAACAGAC 
TGCTCTTTTT 
ACAATAGCTA 
AAAATAAACA 
AAGACTGAAT 
ACTACCAAAT 



51 
I 

GCCCGGCATC 
GCATCTGCTG 
ACTTAATGTA 
GTGCTTCAGG 
TGGGT CAGTG 
ATGGCTTTCT 
GAAGAAGGTA 
ATGGGCACCT 
TCAACAAGTT 
TGGAGTTGAT 
TTGCACTCGG 
AACTG CAGAT 
AAATGACAAC 
TAGACCTGGT 
GCATACGCGC 
TGTGCATCCC 
AGACAAGTAC 
AGGCACATCA 
ACAAAATGCT 
ACCTATAGAA 
AAAGGGAAAT 
TCTTTCTGTT 
AGTAAACAAT 
CTTGGTTACA 
ATATGTGCGG 
TGACCCCGAA 
TTGGATCACC 
GGTTGAAACT 
TAGATCATGT 
AATACTTCAA 
TGTTGATCCT 
TCCAGAAATC 
ATATCAGAAA 
CGGCCAAGCT 
GTGTCGTGCG 
ATTACTGGGT 
TGCAACTAAA 
CACAGAAGCA 
CAACAACTCT 
GGAAACCATT 
GCATCAT CAT 
CACTT ACT CG 
ACACACTGGT 
GCATGCCATC 
GTTCTGTGGG 
TGGAACCCAA 
CAATTAGGTC 
TCAACATGTA 
ATATTTTTAA 
AACTGGTAAA 
TTTTTTTACG 
AGTTATGCTA 
AGAAATATTG 
TAAATTAAAA 
TCATTTGACT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
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TTGGAGGCAA AATGTGTTGA 
GGAAATAAAT GTGTGTGTGT 
AACAAAGAGG AAAATGGTAA 
GAAAAAAGAG AGAGCTTCCT 
GAGGAAATAG TTCCTGTCCA 
TTCTGGTTTC TGTGGGAAGG 
CTGTTTCAAG ATTTCTGCAT 
GGGGTTCCCT GCTTTTTGGT 
ATAACAAAAA CATTTTAAAA 
TTCTCTCTTA TAGTGACCAA 
AGTTTAGAGG CTAGAGGGAG 
ATTGTCCTTA AACCTAAGCC 
TTTCATTTTT CTCCTCACTG 
AGGCCTTGTG GGCCCCCTTC 
CCTTAAGTGA CTCCAGGTTT 
CTTTCTCCAG AGAAATTTTA 
AAAGATCAAG TTGTCATTTT 
TATTTGTACA GTCAGAGGGC 
AAGGAATATG GGTGGGAGTA 
CACTGCCTTT TCCTTTCTCA 
CCAACCTCTT CTCTATGGCT 
TGCATGATGA GTCTGAAGGC 
AGGCATTCAT GGGAATTGTT 
CTATGAATTA AATGCCTATC 
TGACCCTAAA ATCTATGTGT 
TTGAGACGGA GTCTCGCTCT 
CTGAAAGCTC CGCCTCCCGG 
GACTACAGGC GCCCACCACC 
TTCACTGTGT TAG CCAGGAT 
TCCCAAAGTG CTGGGATTAC 
GTCGTCTTCT T TTAATGTAA 
TCAATCTTGA AATACTCAAC 
GCACAAAATA TTGGT CTGAG 
TGTAACCAGA AGCCAGTTTT 
CCCACTCACC GATCAAAACC 
TCAAAGAGCA ACCAGT AT CA 
TGAACATGCT GAAAACCACC 
AAATGAAAAT TTAATTTTAG 
TCCTTATATG TGTAAGGTGA 
AGCTTTCATT TTTCCCCCAG 
TTTTCTTACT TTTATAAGGA 
TTTAAACAGA GTTTTAGTAT 
CTGCTTAAAA TAAGCAAAAA 
AATAAAACAA TATTAACTTG 
TTTACAGATG TGGGGAGATG 
TTTAGAGATT AAATAATTCT 
GAAATAGAAA TACTCAATTA 
TCATTATCAA ATTGTCGACA 
TTGAAGCACA GCTTTACAGA 
GTATTAAAAG TATTAGAAGG 
ACAGGGGTTT TACTTTGAGG 
CAGGCAATAT TGCAGTCTTG 
GACAAGATGA TCCAACCATA 
GGAGTGTGCT CCCCTACAAA 
AAAGCCTTAC ATTTTAATAT 
ACCATTATTT TTGTGTATGT 
ATACCGGATA CATTTCACGT 
GTTGAGAAGC ATGGACACTA 
ACTTCTGTGT GACCTTTGAA 
ATGAACAATG CCAGCCTCAT 
ACATAGAACA CTGCCTGCAC 
ATGTAGTTGG ATATACTACC 
CATATATATA AT CCCGAAAC 
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AGTGCCCTAT 
ATATTATTAT 
AAACTTGAAA 
AGGCCTGGGC 
ATTTGTGTAA 
AAATAGGGAA 
CCACAAGTTA 
AGCAAGGGTC 
CTTACCTTTA 
CATCTTTTTA 
CTGAGGGGAG 
CCACAAACTT 
CCCTTCTTCT 
TTTCGGCTTT 
TCCACCATCC 
AAATAATAGA 
AGAACAGAGG 
AACAGGAAGA 
AAAGCAACAT 
GGCCAATGGC 
CACCTTATTT 
ATTTGCAGGA 
GTATTCCTTC 
TAAAATTCTG 
TTTAGACTTA 
GACGCACAGG 
GTTCATGCCA 
ACGCCCGGCT 
GGTCTCGATC 
AGGCATGACC 
TCATTTTGAA 
CAAAAGACAG 
AATGGAATTC 
ATCTAACGGC 
TGCTACCTCC 
CTTCCCTGTT 
TGGT CTG CAT 
GGATTCATTT 
AATTTATGGT 
TGAATGATTT 
AGCAGCTGTC 
TGCTATTAAA 
TTGGATGCAT 
GCTGCTTAAA 
TAATAAAACA 
AAGATGATCA 
TGTCTTTGTT 
TCATTAATAT 
TGAGTATCTA 
TGGTTATAAT 
ACCAGTGTAG 
ATTGTGCCAC 
AAGGTGCTCT 
CGTTAAGACT 
AGGTTGAACC 
CTTCAAGAAT 
GTCCTTCAGT 
GAGCCAGAAT 
AGGCTACTTA 
GGGGT TGTTG 
ATAGTAAAAG 
GAACAATAT C 
ATG 



GAAGT AG CAA 
TAATCAATGC 
TGAGG CTGGG 
TCTTAAATGC 
TTTGTTTAAA 
TCCAATGGAA 
GTAGCAAACT 
CAGAGATGAG 
CTGAAGTTAA 
AT TTAGATCC 
GATCTTACTG 
GACACCTGAT 
GAGTGGCATT 
CTGCTAAAGC 
TTCAGCGTGA 
AGAAATAGAA 
GAACT TTGGG 
TGCAGGCCTT 
CGTCTGCTTC 
AACTGCCATT 
GGAGTGAGAA 
TGAGCCTGAA 
TGCAGCCCTC 
ATTTATTCCT 
GACTTTTTAT 
CTGGAGTGCA 
TTCTCCTGCC 
AATTTTTTGT 
TCCTGACCTC 
CACCGCTCCC 
CAT GTGTGAA 
TCGAGAAGCC 
TCTGTAAGCC 
TACTGAAACA 
CCAAGACTTT 
TATAAAACCT 
GTATGCCCGA 
CTATATTTTC 
ATTTGAGTGT 
AGAATTTTTT 
TAAAATGCAG 
AGAAGTTACT 
AAAGTAATAT 
ATAAGCAAAA 
ATATTAACTT 
CTTTGCAAAA 
GTATTAATGG 
ATATTGTAAT 
TGATACATAT 
TGCAGAGTAT 
T CAAGGG AAA 
TTACAGGATA 
GTGCTTCACA 
GATCATTTCA 
AAAATTTCAA 
GTT CATTGGA 
ATTGATTTGG 
GCTTGGATAT 
TTTCCTCTCT 
AATGATTAAA 
AATTATAAGT 
TAATCTCTTT 



TTTTCTATAG 
AATATTTAAA 
GTATAGTTTG 
TGCATTATAA 
ATTGTAAATA 
CAGTAGCTTT 
GGGGAATACT 
GTGTTTTTTT 
ATCCTCTATT 
AAAT AAC CAT 
AAAGCACCCT 
CAGGTCTGGG 
GGCCTGAATC 
AACACCTCCA 
ATTAATTTTT 
ATTTTGAATG 
AGAAAGCAGC 
CAAGGGCAAG 
ATACTTTTTC 
TGAGTCCGGT 
ATCAAGGAGA 
CTGGTTGTGC 
CTTCTGGGCA 
ACATTTTCTG 
TGCCCCCCCC 
GTGGCTCCGA 
TCAGCCTCCT 
ATTTTTAATA 
GTGATCCGCC 
GGCCTTGTTT 
AGTTGATCAT 
AGGGGGAGAA 
TAGTTGCTGA 
CCCACTGTGT 
ACTAGTGCCG 
CTAACCATCT 
ATTTGTAATT 
ACATATGTAG 
GCAAGAAAAT 
ATGTAAATAT 
TGGGGTTTGT 
TTGCTTTTAA 
TTACAGATGT 
ATTGGATGCA 
GGTTTCTTGT 
TTATGCTTAT 
GGAATATTTT 
GTTGGGAAGA 
GTATAATAAA 
TCCATGAATA 
ACATGAGTTA 
GATAATGCCT 
GTGAATCTTT 
AAAAT CTATT 
TTCCAGTAAC 
TTTTTGTTTG 
TTGAATATTG 
GAATCCTGGA 
TAGCTTTCTC 
TTAGTTAATA 
GTGAGGTAGT 
TTAGGGAAAT 



GAATATAGTT 
ATGAAATGAG 
T CCTACAAT A 
CTGAGTCTAT 
AATTAAACTT 
GCTTTGCAGT 
CGCTGCAGCT 
CGGGGAGCTA 
GCTGTTTCTA 
GTCCTCCTAG 
GGGGAGATTG 
AGCTACAAAA 
AAGGAAAGCC 
GCAGAGATTC 
AATCAGTTTG 
TATAAAAGAA 
CCAAGTAGGT 
GAGAGGCCAC 
CTAGGCTTGG 
GAGGGAT CAG 
CAGAGCTGAC 
AGAACAAACA 
CTAAGAAGGT 
TTTTCTAATT 
CCCTTTTTTT 
TCTCTGCTCA 
GAGTAGCTGG 
GAGACGGGGT 
TGCCTCGGCC 
TCCGTTTAAA 
ACGAATTGGA 
AGAACTCAGG 
AATTTCCTGC 
TTTGCTCACT 
ATAAACTTTC 
CTTTGTTCTT 
CTTTTCTCTC 
TATTATTATT 
ATATTTTTAA 
ACAGAATGTT 
TTTGCAATGT 
AGAAACTTGG 
GGGGAGATGT 
TAAAGTAATA 
TTTTGCTGTA 
GGCTGGCATG 
GGACAATGTT 
GATCACTATT 
TTTTGATCGG 
GTACACTGAC 
AAAAGAAAAG 
GAACTTTAAT 
TCCCCATGCA 
AG CTAT ATCA 
TTCTATTGTA 
TAATAGTAAA 
GGTCATAATG 
TCTGTCACTT 
AT T AAAAT CA 
TACCTAAAGT 
TGGTAAAATT 
AAAGTTTGTG 



Seq ID NO: 34 Protein sequence:
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MAAAGPRR S V 
ADLIRSSDPD 
KTRHTRETVL 
EPLNLFYIER 
PVFTEAIYNF 
TGVITTVSHY 
EAFVEENAFN 
KPLNYEENRQ 
KENLAVGSKI 
KNELYNITVL 
EPVHGAPFYF 
TKLLRVNLCE 
KRFPEDLAQQ 
MMKGGNQTLE 



11 
I 

RGAVCLHLLL 
FRVLNDGSVY 
RRAKRRWAPI 
DTGNLFCTRP 
EVLESSRPGT 
LDREWDKYS 
VEILRIPIED 
VMLEIGVNNE 
NGYKAYDPEN 
A I DKDDRS CT 
SLPNTSPEIS 
CTHPTQCRAT 
NLIISNTEAP 
SCRGAGHHHT 



21 



TLVIFSRDGE 
TARAVAL SDK 
PCSMQENSLG 
VDREEYDVFD 
TVGWCATDR 
LIMKVQDMDG 
KDLINTANWR 
APFARDIPRV 
RNGNGIiRYKK 
GTLAVNIEDV 
RLWSLTKVND 
SRSTGVILGK 
GDDRVCSANG 
LDSCRGGHTE 



31 
I 

ACKKVILNVP 
KRSFTIWLSD 
PFPIjFLQQVE 
IiIAYASTADG 
DEPDTMHTRIi 
QFFGLIGTST 
VNFT I LKGNE 
TALNRALVTV 
LHDPKGWITI 
NDNPPEILQE 
TAARXiSYQKN 
WAILAILLGI 
FMTQTTNNSS 
VDNCRYTYSE 



41 
I 

SKLEADKI IG 
KRKQTQKEVT 
SDAAQNYTVF 
YSADLPLPLP 
KYSILQQTPR 
CI ITVTDSND 
NGHFKISTDK 
HVRDLDEGPE 
DEISGSIITS 
YWICKPKMG 
AGFQEYTIPI 
ALLFSVLLTL 
QGFCGTMGSG 
WHSFTQPRLG 



51 
I 

RVNLEECFRS 
VLLEHQKKVS 
YSISGRGVDK 
IRVEDENDNH 
SPGLFSVHPS 
NAPTFRQNAY 
ETNEGVLSW 
CTPAAQYVRI 
KILDREVETP 
YTDIIiAVDPD 
TVKDRAGQAA 
VCGVFGATKG 
MKNGGQETIE 
EESIRGHTG 



3360 
3420 
3480 
3540 
3600 
3660 
3720 
3780 
3840 
3900 
3960 
4020 
4080 
4140 
4200 
4260 
4320 
4380 
4440 
4500 
4560 
4620 
4680 
4740 
4800 
4860 
4920 
4980 
5040 
5100 
5160 
5220 
5280 
5340 
5400 
5460 
5520 
5580 
5640 
5700 
5760 
5820 
5880 
5940 
6000 
6060 
6120 
6180 
6240 
6300 
6360 
6420 
6480 
6540 
6600 
6660 
6720 
6780 
6840 
6900 
6960 
7020 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
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Seq ID NO: 35 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 146-1273
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1 11 21 31 41 51 

I I 1 1 I I 

GGGAGTGGGC GTGGCGGTGC TGCCCAGGTG AGCCACCGCT GCTTCTGCCC AGACACGGTC 60 

5 GCCTCCACAT CCAGGTCTTT GTGCTCCTCG CTTGCCTGTT CCTTTTCCAC GCATTTTCCA 120 

GGATAACTGT GACTCCAGGC CCGCAATGGA TGCCCTGCAA CTAGCAAATT CGGCTTTTGC 180 

CGTTGATCTG TTCAAACAAC TATGTGAAAA GGAGCCACTG GGCAATGTCC TCTTCTCTCC 240 

AATCTGTCTC TCCACCTCTC TGTCACTTGC TCAAGTGGGT GCTAAAGGTG ACACTGCAAA 3 00 

TGAAAT TGGA CAGGTTCTTC ATTTTGAAAA TGT CAAAGAT ATACCCTTTG GATTTCAAAC 360 

10 AGTAACATCG GATGTAAACA AACTTAGTTC CTTTTACTCA CTGAAACTAA TCAAGCGGCT 420 

CTACGTAGAC AAATCTCTGA ATCTTTCTAC AGAGTT CATC AGCTCTACGA AGAGACCCTA 480 

TGCAAAGGAA TTGGAAACTG TTGACTTCAA AGATAAATTG GAAGAAACGA AAGGTCAGAT 540 

CAACAACTCA ATTAAGGATC TCACAGATGG CCACTTTGAG AACATTTTAG CTGACAACAG 600 

TGTGAACGAC CAGACCAAAA TCCTTGTGGT TAATGCTGCC TACTTTGTTG GCAAGTGGAT 660 

15 GAAGAAATTT CCTGAAT GAG AAACAAAAGA ATGTCCTTTC AGACTCAACA AGACAGACAC 72 0 

CAAACCAGTG CAGATGATGA ACATGGAGGC CACGTTCTGT ATGGGAAACA TTGACAGTAT 780 

CAATTGTAAG AT CAT AGAGC TTCCTTTTCA AAATAAGCAT CTCAGCATGT TCATCCTACT 840 

ACCCAAGGAT GTGGAGGATG AGTCCACAGG CTTGGAGAAG ATTGAAAAAC AACTCAACTC 900 

AGAGTCACTG TCACAGTGGA CTAATCCCAG CACCATGGCC AATGCCAAGG TCAAACTCTC 960 

20 CATTCCAAAA TTTAAGGTGG AAAAGATGAT TGATCCCAAG GCTTGTCTGG AAAATCTAGG 102 0 

GCTGAAACAT ATCTTCAGTG AAGACACATC TGATTTCTCT GGAATGTCAG AGACCAAGGG 1080 

AGTGGCCCTA TCAAATGTTA TCCACAAAGT GTGCTTAGAA ATAACTGAAG ATGGTGGGGA 1140 

TTCCATAGAG GTGCCAGGAG CACGGATCCT GCAGCACAAG GATGAATTGA ATGCTGACCA 1200 

TCCCTTTATT TACATCAT CA GGCACAACAA AACTCGAAAC ATCATTTTCT TTGGCAAATT 12 60 

25 CTGTTCTCCT TAAGTGGCAT AGCCCATGTT AAGTCCTCCC TGACTTTTCT GTGGATGCCG 1320 

ATTTCTGTAA ACTCTG CATC CAGAGATTCA TTTTCTAGAT ACAATAAATT GCTAATGTTG 1380 

CTGGAT CAGG AAGCCGCCAG TACTTGTCAT ATGTAGCCTT CACACAGATA GACCTTTTTT 1440 

TTTTTCCAAT TCTATCTTTT GTTTCCTTTT TTCCCATAAG ACAATGACAT ACGCTTTTAA 1500 

TGAAAAGGAA TCACGTTAGA GGAAAAATAT TTATT CATTA TTTGTCAAAT TGTCCGGGGT 1560 

30 AGTTGGCAGA AATACAGTCT TCCACAAAGA AAATTCCTAT AAGGAAGATT TGGAAGCT CT 1620 

TCTTCCCAGC ACTATGCTTT CCTTCTTTGG GATAGAGAAT GTTCCAGACA TTCTCGCTTC 1680 

CCTGAAAGAC TGAAGAAAGT GTAGTGCATG GGACCCACGA AACTGCCCTG GCTCCAGTGA 1740 

AACTTGGGCA CATGCT CAGG CTACTATAGG TCCAGAAGTC CTTATGTTAA GCCCTGGCAG 1800 

GCAGGTGTTT ATTAAAATTC TGAATTTTGG GGATTTTCAA AAGATAATAT TT TAG ATACA 1860 

35 CTGTATGTTA TAGAACTTCA TGGATCAGAT CTGGGGCAGC AACCTATAAA TCAACACCTT 1920 

AATATGCTGC AACAAAATGT AGAATATTCA GACAAAATGG ATACATAAAG ACTAAGTAGC 1980 

CCATAAGGGG TCAAAATTTG CTGCCAAATG CGTATGCCAC CAACTTACAA AAACACTTCG 2040 

TTCGCAGAGC TTTTCAGATT GTGGAATGTT GGATAAGGAA TTATAGACCT CTAGTAGCTG 2100 

AAATG CAAGA CCCCAAGAGG AAGTTCAGAT CTTAATATAA ATTCACTTTC ATTTTTGATA 2160 

40 GCTGTCCCAT CTGGT CATGT GGTTGGCACT AGACTGGTGG CAGGGGCTTC TAGCTGACTC 2220 

GCACAGGGAT TCTCACAATA GCCGATATCA GAATTTGTGT TGAAGGAACT TGTCTCTTCA 2280 

TCTAATATGA TAGCGGGAAA AGGAGAGGAA ACTACTGCCT TTAGAAAATA TAAGTAAAGT 2340 

GATTAAAGTG CTCACGTTAC CTTGACACAT AGTTTTTCAG TCTATGGGTT TAGTTACTTT 2400 

AGATGGCAAG CATGT AACTT ATATTAATAG TAATTTGTAA AGTTGGGTGG ATAAGCTATC 2460 

45 CCTGTTGCCG GTTCATGGAT TACTTCTCTA TAAAAAATAT ATATTTACCA AAAAATTTTG 2 520 

TGACATTCCT TCTCCCATCT CTTCCTTGAC ATGCATTGTA AATAGGTTCT TCTTGTTCTG 2580 
AGATTCAATA TTGAATTTCT CCTATGCTAT TGACAATAAA ATATTATTGA ACTACC 

Seq ID NO: 36 Protein sequence: 
50 Protein Accession #: NP_002630.1

1 11 21 31 41 51 

| | | | | |

MDALQLANSA FAVDLFKQLC EKEPLGNVLF SPICLSTSLS LAQVGAKGDT ANEIGQVLHF 60 

55 ENVKDIPFGF QTVTSDVNKL SSFYSLKLIK RLYVDKSLNL STEFISSTKR PYAKELETVD 120 

FKDKLEETKG QINNSIKDLT DGHFENILAD NSVNDQTKIL VVNAAYFVGK WMKKFPESET 180

KECPFRLNKT DTKPVQMMNM EATFCMGNID SINCKIIELP FQNKHLSMFI LLPKDVEDES 240 

TGLEKIEKQL NSESLSQWTN PSTMANAKVK LSIPKFKVEK MIDPKACLEN LGLKHIFSED 300 

TSDFSGMSET KGVALSNVIH KVCLEITEDG GDSIEVPGAR ILQHKDELNA DHPFIYIIRH 360 
60 NKTRNIIFFG KFCSP 



Seq ID NO: 37 DNA sequence 
Nucleic Acid Accession #: NM_0168583 
65 Coding sequence: 72-842 

1 11 21 31 41 51 

l I l I I l 

GGAGTGGGGG AGAGAGAGGA GACCAGGACA GCTGCTGAGA CCTCTAAGAA GTCCAGATAC 60 

70 TAAGAGCAAA GATGTTTCAA ACTGGGGGCC TCATTGTCTT CTACGGGCTG TTAGCCCAGA 120 

CCATGGCCCA GTTTGGAGGC CTGCCCGTGC CCCTGGACCA GACCCTGCCC TTGAATGTGA 180 

ATCCAGCCCT GCCCTTGAGT CCCACAGGTC TTGCAGGAAG CTTGACAAAT GCCCTCAGCA 240 

ATGGCCTGCT GTCTGGGGGC CTGTTGGGCA TTCTGGAAAA CCTTCCGCTC CTGGACATCC 300 

TGAAGCCTGG AGGAGGTACT TCTGGTGGCC TCCTTGGGGG ACTGCTTGGA AAAGTGACGT 360 

75 CAGTGATTCC TGGCCTGAAC AACATCATTG ACATAAAGGT CACTGACCCC CAGCTGCTGG 420 

AACTTGGCCT TGTGCAGAGC CCTGATGGCC ACCGTCTCTA TGTCACCATC CCTCTCGGCA 480 

TAAAGCTCCA AGTGAATACG CCCCTGGTCG GTGCAAGTCT GTTGAGGCTG GCTGTGAAGC 540 

TGGACATCAC TGCAGAAATC TTAGCTGTGA GAGATAAGCA GGAGAGGATC CACCTGGTCC 600 

TTGGTGACTG CACCCATTCC CCTGGAAGCC TGCAAATTTC TCTGCTTGAT GGACTTGGCC 660 

80 CCCTCCCCAT TCAAGGTCTT CTGGACAGCC TCACAGGGAT CTTGAATAAA GTCCTGCCTG 720 

AGTTGGTTCA GGGCAACGTG TGCCCTCTGG TCAATGAGGT TCTCAGAGGC T TGGA CAT CA 780 

CCCTGGTGCA TGACATTGTT AACATGCTGA TCCACGGACT ACAGTTTGTC ATCAAGGT CT 840 

AAGCCTTCCA GGAAGGGGCT GGCCTCTGCT GAGCTGCTTC CCAGTGCTCA CAGATGGCTG 900 

GCCCATGTGC TGGAAGATGA CACAGTTGCC TTCTCTCCGA GGAACCTGCC CCCTCTCCTT 960 

85 TCCCACCAGG CGTGTGTAAC ATCCCATGTG CCTCACCTAA TAAAATGGCT CTTCTTCTGC 1020 
AAAAAAAAAA AAAAAAAAAA AAAAAAAAA 



203 



WO 02/086443 

Seq ID NO: 38 Protein sequence:
Protein Accession #: NP_057667



PCT/US02/12476 



10 



1 11 21 31 41 51 

I I I I I I 

MFQTGGLIVF YGLLAQTMAQ FGGLPVPLDQ TLPLNVNPAL PLSPTGLAGS LTNALSNGLL 60

SGGLLGILEN LPLLDILKPG GGTSGGLLGG LLGKVTSVIP GLNNIIDIKV TDPQLLELGL 120

VQSPDGHRLY VTIPLGIKLQ VNTPLVGASL LRLAVKLDIT AEILAVRDKQ ERIHLVLGDC 180 

THSPGSLQIS LLDGLGPLPI QGLLDSLTGI LNKVLPELVQ GNVCPLVNEV LRGLDITLVH 240 
DIVNMLIHGL QFVIKV



15 



Seq ID NO: 39 DNA sequence

Nucleic Acid Accession #: NM_004363.1

Coding sequence: 115-2223 



20 



25 



30 



35 



40 



45 



50 



55 



60 



65 



70 



75 



80 



11 



21 



CTCAGGGCAG 

TCCTGGAACT 

TCTCCCTCGG 

TCACTTCTAA 

TTCAATGTCG 

TTTGGCTACA 

GTAATAGGAA 

CCCAATGCAT 

CACGTCATAA 

GAGCTGCCCA 

GTGGCCTTCA 

CAGAGCCTCC 

TTCAATGTCA 

GCCAGGCGCA 

TCCCCTCTAA 

TCTAACCCAC 

GAGCTCTTTA 

AACTCAGACA 

CCCAAACCCT 

TTAACCTGTG 

CTCCCGGTCA 

GTCACAAGGA 

CACAGCGACC 

TCATACACCT 

CCACCTGCAC 

TTTATCTCCA 

GCCAGTGGCC 

CCCTCCATCT 

TGTGAACCTG 

GTCAGTCCCA 

AGAAATGACG 

GACCCAGTCA 

TCGTCTTACC 

CCGCAGTATT 

GCCAAAATCA 

GGCCGCAATA 

CTCTCAGCTG 

TAGCAGCCCT 

TAAAGCATTT 

AGACTCTGAC 

AAATACAAAA 

TGAGGCAGGA 

ACTGCACTCC 

TCTGACCTGT 

AACTTTAATG 

TAATTAATTT 

TTCCCAGATT 

AAATATACTT 

AGACTTGGGA 

TCAATAAAAA 



AGGGAGGAAG 

CAAGCTCTTC 

CCCCTCCGCA 

CCTTCTGGAA 

CAGAGGGGAA 

GCTGGTACAA 

CTCAACAAGC 

CCCTGCTGAT 

AGTCAGATCT 

AGCCCTCCAT 

CCTGTGAACC 

CGGTCAGTCC 

CAAGAAATGA 

GTGATTCAGT 

ACACATCTTA 

CTGCACAGTA 

TCCCCAACAT 

CTGGCCTCAA 

TCATCACCAG 

AACCTGAGAT 

GTCCCAGGCT 

ATGATGTAGG 

CAGTCATCCT 

ATTACCGTCC 

AGTATTCTTG 

ACATCACTGA 

ACAGCAGGAC 

CCAGCAACAA 

AGGCTCAGAA 

GGCTGCAGCT 

CAAGAGCCTA 

CCCTGGATGT 

TTTCGGGAGC 

CTTGGCGTAT 

CGCCAAATAA 

AT TCCATAGT 

GGGCCACTGT 

GGTGTAGTTT 

GCAACAGCTA 

C AG AG AT CG A 

ATGAGCTGGG 

GAATCGCTTG 

AGTCTGGCAA 

ACTCTTGAAT 

AACTAACTGA 

CATGGGACTA 

TCAGGAAACT 

TTGTGAACAA 

AACTATTCAT 

TCTGCTCTTT 



GACAGCAGAC 
TCCACAGAGG 
CAGATGGTGC 
CCCGCCCACC 
GGAGGTGCTT 
AGGTGAAAGA 
TACCCCAGGG 
CCAGAACATC 
TGTGAATGAA 
CTCCAGCAAC 
TGAGACTCAG 
CAGGCTGCAG 
CACAGCAAGC 
CATCCTGAAT 
CAGAT CAGGG 
CTCTTGGTTT 
CACTGTGAAT 
TAGGACCACA 
CAACAACTCC 
T C AG AACAC A 
GCAGCTGTCC 
ACCCTATGAG 
GAATGTCCTC 
AGGGGTGAAC 
GCTGATTGAT 
GAAGAACAGC 
TACAGTCAAG 
CTCCAAACCC 
CACAACCTAC 
GTCCAATGGC 
TGTATGTGGA 
CCTCTATGGG 
GAACCTCAAC 
CAATGGGATA 
TAACGGGACC 
CAAGAGCAT C 
CGGCATCATG 
CTTCATTTCA 
CAGTCTAAAA 
GACCATCCTA 
CTTGGTGGCG 
AACCCGGGAG 
CAGAGCAAGA 
ACAAGTTTCT 
CAGCTTCATG 
AATGAACTAA 
TTTTTTCTTT 
AAATTGAGAC 
GAATATTTAT 
GTATAACAGA 



31 
I 

CAGACAGT C A 

AGGACAGAGC 

ATCCCCTGGC 

ACTGCCAAGC 

CTACTTGTCC 

GTGGATGGCA 

CCCGCATACA 

AT CCAGAATG 

GAAGCAACTG 

AACTCCAAAC 

GACGCAACCT 

CTGTCCAATG 

TACAAATGTG 

GTCCTCTATG 

GAAAATCTGA 

GTCAATGGGA 

AATAGTGGAT 

GTCACGACGA 

AACCCCGTGG 

ACCTACCTGT 

AATGACAACA 

TGTGGAATCC 

TATGGCCCAG 

CTCAGCCTCT 

GGGAACATCC 

GGACTCTATA 

ACAATCACAG 

GTGGAGGACA 

CTGTGGTGGG 

AACAGGACCC 

ATCCAGAACT 

CCGGACACCC 

CTCTCCTGCC 

CCGCAGCAAC 

TATGCCTGTT 

ACAGTCTCTG 

ATTGGAGTGC 

GGAAGACTGA 

TTGCTTCTTT 

GCCAACATCG 

CGCACCTGTA 

GTGGAGATTG 

CTCCATCTCA 

GATACCACTG 

AAACTGTCCA 

TGAGGATTGC 

TAAGCTATCC 

ATTTACATTT 

ATTGTATGGT 

AAAA 



41 
I 

CAGCAGCCTT 

AGACAGCAGA 

AGAGGCTCCT 

TCACTATTGA 

ACAATCTGCC 

ACCGTCAAAT 

GTGGTCGAGA 

ACACAGGATT 

GCCAGTTCCG 

CCGTGGAGGA 

ACCTGTGGTG 

GCAACAGGAC 

AAACCCAGAA 

GCCCGGATGC 

ACCTCTCCTG 

CTTTCCAGCA 

CCTATACGTG 

TCACAGTCTA 

AGGATGAGGA 

GGTGGGTAAA 

GGACCCTCAC 

AGAACGAATT 

ACGACCCCAC 

CCTGGCATGC 

AGCAACACAC 

CCTGCCAGGC 

TCTCTGCGGA 

AGGATGCTGT 

TAAATGGTCA 

T CACTCT ATT 

CAGTGAGTGC 

CCATCATTTC 

ACTCGGCCTC 

ACACACAAGT 

TTGTCTCTAA 

CATCTGGAAC 

TGGTTGGGGT 

CAGTTGTTTT 

ACCAAGGATA 

TGAAACCCCA 

GTCCCAGTTA 

CAGTGAGCCC 

AAAAGAAAAG 

CACTGTCTGA 

CCAAGATCAA 

TGATTCTTTA 

ACTCTTACAG 

TCTCCCTATG 

AATATAGTTA 



51 
I 

GACAAAACGT 

GACCATGGAG 

GCTCACAGCC 

ATCCACGCCG 

CCAGCATCTT 

TATAGGATAT 

GATAATATAC 

CTACACCCTA 

GGTATACCCG 

CAAGGATGCT 

GGTAAACAAT 

CCTCACTCTA 

CCCAGTGAGT 

CCCCACCATT 

CCACGCAGCC 

ATCCACCCAA 

CCAAGCCCAT 

TGCAGAGCCA 

TGCTGTAGCC 

TAATCAGAGC 

TCTACTCAGT 

AAGTGTTGAC 

CATTTCCCCC 

AGCCTCTAAC 

ACAAGAGCTC 

CAATAACTCA 

GCTGCCCAAG 

GGCCTTCACC 

GAGCCTCCCA 

CAATGTCACA 

AAACCGCAGT 

CCCCCCAGAC 

TAACCCATCC 

TCTCTTTATC 

CTTGGCTACT 

TTCTCCTGGT 

TGCTCTGATA 

GCTTCTTCCT 

TTTACAGAAA 

TCTCTACTAA 

CTCGGGAGGC 

AGATCGCACC 

AAAAGAAGAC 

GAATTTCCAA 

G CAG AG AAAA 

AATGT CTTGT 

CAATTTGATA 

TGGTCGCTCC 

TTGCACAAGT 



Seq ID NO: 40 Protein sequence: 
Protein Accession #: NP_004354.1



85 



MESPSAPPHR 
HLFGYSWYKG 
TLHVIKSDLV 
NNQSLPVSPR 
TISPLNTSYR 
AHNSDTGLNR 
QSLPVSPRLQ 
SPSYTYYRPG 
NSASGHSRTT 
IjPVSPRLQLS 
PDSSYLSGAN 
ATGRNNSIVK 



11 
I 

WCIPWQRLLL 
ERVDGNRQII 
NEEATGQFRV 
LQLSNGNRTL 
SGENLNLSCH 
TTVTTITVYA 
LSNDNRTDTL 
VNLSLSCHAA 
VKTI TVSAEL 
NGNRTLTLFN 
LNLSCHSASN 
SITVSASGTS 



21 

1 

TASLLTFWNP 
GYVIGTQQAT 
YPELPKPSIS 
TLFNVTRNDT 
AASNPPAQYS 
EPPKPFITSN 
LSVTRNDVGP 
SNPPAQYSWL 
PKPSISSNNS 
VTRNDARAYV 
PSPQYSWRIN 
PGLSAGATVG 



31 
I 

PTTAKLTIES 
PGPAYSGRE I 
SNNSKPVEDK 
ASYKCETQNP 
WFVNGTFQQS 
NSNPVEDEDA 
YECGIQNELS 
IDGNIQQHTQ 
KPVEDKDAVA 
CGIQNSVSAN 
GIPQQHTQVL 
IMIGVLVGVA 



41 
I 

TPFNVAEGKE 
IYPNASLLIQ 
DAVAFTCEPE 
VSARRSDSVI 
TQELFIPNIT 
VALTCEPEIQ 
VDHSDPVILN 
ELFISNITEK 
FTCEPEAQNT 
RSDPVTLDVL 
FIAKITPNNN 
LI 



51 
I 

VLLLVHNLPQ 
NIIQNDTGFY 
TQDATYLWWV 
LNVLYGPDAP 
VNNSGSYTCQ 
NTTYLWWVNN 
VLYGPDDPTI 
NSGLYTCQAN 
TYLWWVNGQS 
YGPDTPIISP 
GTYACFVSNL 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 



204 



WO 02/086443 



PCT/US02/12476 



Seq ID NO: 41 DNA sequence 

Nucleic Acid Accession #: NM_006952.1 

Coding sequence: 11-793 

1 11 21 31 41 51

1 I I I I I 

AATCCCGACA ATGGCGAAAG ACAACTCAAC TGTTCGTTGC TTCCAGGGCC TGCTGATTTT 60 

TGGAAATGTG ATTATTGGTT GTTGCGGCAT TGCCCTGACT GCGGAGTGCA TCTTCTTTGT 120 

10 ATCTGACCAA CACAGCCTCT ACCCACTGCT TGAAGCCACC GACAACGATG ACATCTATGG 180 

GGCTGCCTGG ATCGGCATAT TTGTGGGCAT CTGCCTCTTC TGCCTGTCTG TTCTAGGCAT 240 

TGTAGGCATC ATGAAGTCCA GCAGGAAAAT TCTTCTGGCG TATTTCATTC TGATGTTTAT 300 

AGTATATGCC TTTGAAGTGG CATCTTGTAT CACAGCAGCA ACACAACGAG ACTTTTTCAC 3 60 

ACCCAACCTC TTCCTGAAGC AGATGCTAGA GAGGTACCAA AACAACAGCC CTCCAAACAA 42 0 

15 TGATGACCAG TGGAAAAACA ATGGAGTCAC CAAAACCTGG GACAGGCTCA TGCTCCAGGA 480 

CAATTGCTGT GGCGTAAATG GTCCAT CAGA CTGGCAAAAA TACACATCTG CCTTCCGGAC 540 

TGAGAATAAT GATGCTGACT ATCCCTGGCC TCGTCAATGC TGTGTTATGA ACAATCTTAA 600 

AGAACCTCTC AACCTGGAGG CTTGTAAACT AGGCGTGCCT GGTTTTTATC ACAAT CAGGG 660 

CTGCTATGAA CTGATCTCTG GTCCAATGAA CCGACACGCC TGGGGGGTTG CCTGGTTTGG 720 

20 AT TTGCCATT CTCTGCTGGA CTTTTTGGGT TCTCCTGGGT ACCATGTTCT ACTGGAGCAG 7 80 

AAT TGAATAT TAAGAA 



25 



Seq ID NO: 42 Protein sequence: 
Protein Accession #: NP_008883.1



11 21 31 41 51 

1 I 1 1 I 

MAKDNSTVRC FQGLLIFGNV IIGCCGIALT AECIFFVSDQ HSLYPLLEAT DNDDIYGAAW 60

IGIFVGICLF CLSVLGIVGI MKSSRKILLA YFILMFIVYA FEVASCITAA TQRDFFTPNL 120

30 FLKQMLERYQ NNSPPNNDDQ WKNNGVTKTW DRLMLQDNCC GVNGPSDWQK YTSAFRTENN 180 

DADYPWPRQC CVMNNLKEPL NLEACKLGVP GFYHNQGCYE LISGPMNRHA WGVAWFGFAI 240 

LCWTFWVLLG TMFYWSRIEY 

35 Seq ID NO: 43 DNA sequence 

Nucleic Acid Accession #: Eos sequence 
Coding sequence: 83-2605

1 11 21 31 41 51 

40 i | | | 



GCCGGACAGA TCTGCGCGTA TCCTGGAGCC GGCCCAGTTG TGAACTAGGA GAGCTTTGGG 60 

ACCTCTGTCC CAAGCAAGAG AGATGAATGG AGAGTATAGA GGCAGAGGAT TTGGACGAGG 120 

AAGATTTCAA AGCTGGAAAA GGGGAAGAGG TGGTGGGAAC TTCT CAGGAA AATGGAGAGA 180 

AAGAGAACAC AGACCTGATC TGAGTAAAAC CACAGGAAAA CGTACTTCTG AACAAACCCC 240 

45 ACAGTTTTTG CTTTCAACAA AGACCCCACA GTCAATGCAG TCAACATTGG AT CGATTCAT 300 

ACCATATAAA GGCTGGAAGC TTTATTTCTC TGAAGTTTAC AGCGATAGCT CTCCTTTGAT 360 

TGAGAAGATT CAAGCATTTG AAAAATTTTT CACAAGGCAT ATTGATTTGT ATGACAAGGA 420 

TGAAATAGAA AGAAAGGGAA GTATTTTGGT AGATTTTAAA GAACTGACAG AAGGTGGTGA 480 

AGTAACTAAC TTGATACCAG ATATAGCAAC TGAACTAAGA GATGCACCTG AGAAAACCTT 540 

50 GGCTTGCATG GGTTTGGCAA TACATCAGGT GTTAACTAAG GACCTTGAAA GGCATGCAGC 600 

TGAGTTACAA GCCCAGGAAG GATTGTCTAA TGATGGAGAA ACAATGGTAA ATGTGCCACA 660 

TATTCATGCA AGGGTGTACA ACTATGAGCC TTTGACACAG CTCAAGAATG TCAGAGCAAA 720 

TTACTATGGA AAATACATTG CTCTAAGAGG GACAGTGGTT CGTGT CAGTA ATATAAAGCC 780 

TCTTTGCACC AAGATGGCTT TTCTTTGTGC TGCATGTGGA GAAATTCAGA GCTTTCCTCT 840 

55 TCCAGATGGA AAAT ACAGT C TTCCCACAAA GTGTCCTGTG CCTGTGTGTC GAGGCAGGTC 900 

ATTTACTGCT CTCCGCAGCT CTCCTCTCAC AGTTACGATG GACTGGCAGT CAATCAAAAT 960 

CCAGGAATTG ATGTCTGATG ATCAGAGAGA AGCAGGTCGG ATTCCACGAA CAATAGAATG 1020 

TGAGCTTGTT CATGATCTTG TGGATAGCTG TGTCCCGGGA GACACAGTGA CTATTACTGG 1080 

AATTGT CAAA GTCTCAAATG CGGAAGAAGG TTCTCGAAAT AAGAATGACA AGTGTATGTT 1140 

60 CCTTTTGTAT ATTGAAGCAA ATTCTATTAG TAATAGCAAA GGACAGAAAA CAAAGAGTTC 12 0 0 

TGAGGATGGG TGTAAGCATG GAATGTTGAT GGAGTTCTCA CTTAAAGACC TTTATGCCAT 1260 

CCAAGAGATT CAAGCTGAAG AAAACCTGTT TAAACTCATT GTCAACTCGC TTTGCCCTGT 132 0 

CATTTTTGGT CATGAACTTG TTAAAGCAGG TTTGGCATTA GCACTCTTTG GAGGAAGCCA 13 80 

GAAATACGCA GATGACAAAA ACAGAATTCC AATTCGGGGA GACCCCCACA TCCTTGTTGT 1440 

65 TGGAGATCCA GGCCTAGGAA AAAGTCAAAT GCTACAGGCA GCGTGCAATG TTGCCCCACG 1500 

TGGCGTGTAT GTTTGTGGTA ACACCACGAC CACCTCTGGT CTGACGGTAA CTCTTTCAAA 1560 

AGATAGTTCC TCTGGAGATT TTGCTTTGGA AGCTGGTGCC CTGGTACTTG GTGATCAAGG 1620 

TATTTGTGGA ATCGATGAAT TTGATAAGAT GGGGAATCAA CATCAAGCCT TGTTGGAAGC 1680 

CATGGAGCAG CAAAGTATTA GTCTTGCTAA GGCTGGTGTG GTTTGTAGCC TTCCTGCAAG 1740 

70 AACTTCCATT ATTGCTGCTG CAAATCCAGT TGGAGGACAT TACAATAAAG CCAAAACAGT 1800 

TTCTGAGAAT TTAAAAATGG GGAGTGCACT ACTATCCAGA TTTGATTTGG TCTTTATCCT 1860 

GTTAGATACT CCAAATGAGC ATCATGATCA CTTACTCTCT GAACATGTGA TTGCAATAAG 1920 

AGCTGGAAAG CAGAGAACCA TTAGCAGTGC CACAGTAGCT CGTATGAATA GTCAAGATTC 1980 

AAATACTT CC GTACTTGAAG TAGTTTCTGA GAAGCCATTA TCAGAAAGAC TAAAGGTGGT 2 040 

75 TCCTGGAGAA AC AAT AGAT C CCATTCCCCA CCAGCTATTG AGAAAGTACA TTGGCTATGC 2100 

TCGGCAGTAT GTGTACCCAA GGCTATCCAC AGAAGCTGCT CGAGTTCTTC AAGATTTTTA 2160 

CCTTGAGCTC CGGAAACAGA GCCAGAGGTT AAATAGCTCA CCAATCACTA CCAGGCAGCT 2220 

GGAATCTTTG ATTCGTCTGA CAGAGGCACG AGCAAGGTTG GAATTGAGAG AGGAAGCAAC 2280 

CAAAGAAGAC GCTGAGGATA TAGTGGAAAT TATGAAATAT AGCATGCTAG GAACTTACTC 2340 

80 TGATGAATTT GGGAACCTAG ATT TTGAGCG AT CCCAGCAT GGTTCTGGAA TGAGCAACAG 2400 

GTCAACAGCG AAAAGATTTA TTTCTGCTCT CAACAACGTT GCTGAAAGAA CTTATAATAA 2460 

TATATTTCAA TTTCATCAAC TTCGGCAGAT TGCCAAAGAA C T AAA CAT T C AGGTTGCTGA 2520 

TTTTGAAAAT TTTATTGGAT CACTAAATGA CCAGGGTTAC CTCTTGAAAA AAGGCCCAAA 2580 

AGTTTACCAG CTTCAAACTA TGTAAAAGGA CTTCACCAAG TTAGGGCCTC CTGGGTTTAT 2640 

85 TGCAGATTAA AGCCATCTCA GTGAAGATAT GCGTGCACGC ACAGACAGAC AGACACACAC 2700 

ACACACACAC ACACACACAC ACACACACAC ACACACAGTC AAATACTGTT CTCTGAAAAA 2760 

TGATGTCCCA AAAGTATTAT AATAGGAAAA AAG CAT T AAA TATAATAAAC TAATTTAAGA 2820 
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10 



15 



20 



25 



WO 02/086443 

AGTGATAAAG TCTCCAGATG 
GGTGAGAGGA TTCCTTGAGG 
CATTTCTTAA AAAAAAAAAA 
TAGTCTCAGC TACTTGTGAG 
TACAGTGAGC CACAATCACA 
GACTCAAAAA AATAAAAAAA 
CCAAAGGGCT AAAAGTAAAT 
TTATATGTAT GAATATTTCA 
AAACCAATGA ATATATTACA 
ATTTGAATTT CATAAAATTT 
GCTATTTAAT AATAGGTCTC 
AATAGAAACA GACTGATTAA 
AATTATTAGA AGGCAGGTGA 
GCCTTAGAAT TGGACTAAGG 
AGAAAGTGCT GCTGCCTCCC 
GAATGCCCCC ACCCGCACCG 
ATTGCTGAAT TCAAAAAAGA 
TATGCCCCTT TCATAGGCTG 
AATAAGACCA GAATTTCTCA 
AAACTAT CAA TCATGTATAA 
GTGAACCATT GTTGGAGAAT 
AATGTAAATA AAAAGAACTG 
GATGTGGAGA CTATTGCCAT 
GGAAT CAAAA GGGGCCAGGT 
GAGGCAGGAG GATCACTTGA 
TATCTCTACA AAAAATAGAT 
GTGGAGGCTG AAGTAGGAAA 
TTATACCACT GCACTCCAGC 



PCT/US02/12476 



CAGTAGCTCA 
CCAGGGTTCG 
AAAAAATTTA 
GCTGAGGCAG 
CCAAT CACTG 
ATTGTAGTGG 
TACTTATAAA 
TAGTTTTGCA 
TATTCTGTGT 
TCCCATGTCA 
ATTTATTCCA 
GCAGGAGAAG 
ACCAGGAGGG 
AAGAAGCTGC 
TGCCCCACCT 
GAACAGCAAC 
AGTTGCATAC 
CTAGGGAGTT 
TATGTTGTGA 
AT C CAAC AAA 
CTACTAAAAT 
GCAGTGTATA 
AGACCACAAT 
GCAGTGGCTC 
AGCCAGTTTT 
TAGCTGGGCA 
TCACTTGAGC 
CTGGGCAAGA 



CACTGTAATC 
AGACCAACCT 
AACTTAGCTG 
GAGGATT CTT 
CACTCCAGCC 
TAGCCATGTG 
TTTTTTATAG 
TATCAGATGT 
T CCAAT AAAA 
AGAATACAAA 
CAGGCTGTAG 
TTTTTTGAAA 
TAAGCTTCCA 
TGACACTCCA 
TTGCCACTTC 
AAAAGGATTC 
AAAGACATCT 
TTCCTGGTTC 
GAGGAT TCAA 
CACTTTGTAA 
ACGGCTTCCC 
TCAGATGTTT 
GTAAATTTTT 
ACATCTATAA 
GAGACCAGCC 
CGGTGGTGCA 
CCGAGAGTTT 
GAGCAAGACC 



ACAGTGACTC 
TGGGCAACAT 
GGTATGGTGG 
TGAGCCCAGG 
TGGGCAATAA 
TTAATTGTTA 
TTGTATTTTT 
AGGCATACAG 
CTTTATTTAT 
ATACTTGAGT 
TTTGTAGTCT 
GAATTTTGTT 
GCAGCAATTT 
CTGCCACACA 
TGCAGCAGGA 
TGCATGAGAT 
GATTGAAAAA 
TACTTTCAGG 
ATGTTACAGG 
CATACAAGAA 
GCAAACGAAG 
AACTATAGGA 
AAGTGAGGAA 
TCCCAGAGCT 
TATGCAACAC 
TGCCTATTGT 
GAGGTTACAG 
TTGTCTCTT 



AGGAGGCTGA 2880 

AGCAAGACCC 2940 

CACATGCCTA 3000 

AGTTTGAGGT 3060 

AGTAACTCTT 3120 

AATAAATTCT 3180 

GACCTGCCTT 3240 

ACAAATACAT 3300 

GGACACTAAA 3360 

TTTGTTTTTA 3420 

TGCTTGAAAC 3480 

TGGCTCACGG 3540 

GTAAAACCAT 3 600 

GGGCACTGGA 3660 

ATAGGTAGAA 372 0 

GCCTCCCTAA 3780 

GGGTATGTTA 3840 

TGGTGGGATC 3 900 

GTTGCCAGCC 3 960 

CTCAGGAAAT 4020 

ATGAATGGAA 4080 

CCAGAACTAA 4140 

GGAAAAATCA 4200 

TTGGGAGTTC 42 60 

ATTGAGACCC 4320 

CCTACCTACT 43 80 

TGAGCTATGA 4440 



30 



Seq ID NO: 44 Protein sequence:
Protein Accession #: CAB55276.2



35 



40 



45 



50 



55 



60 



65 



70 



75 



1 
I 

MNGEYRGRGF 
TPQSMQSTLD 
ILVDFKELTE 
L SNDGETMVN 
LCAACGEIQS 
QREAGRIPRT 
SISNSKGQKT 
KAGLALALFG 
TTTTSGLTVT 
LAKAGWCSL 
HDHLLSEHVI 
IPHQLLRKYI 
EARARLELRE 
SALNNVAERT 



11 

I 

GRGRFQSWKR 
RF I PYKGWKL 
GGEVTNLIPD 
VPHIHARVYN 
FPLPDGKYSL 
IECELVHDLV 
KSSEDGCKHG 
GSQKYADDKN 
LSKDSSSGDF 
PARTS I IAAA 
AIRAGKQRTI 
GYARQYVYPR 
EATKEDAED I 
YNNIFQFHQL 



21 
i 

GRGGGNFSGK 
YFSEVYSDSS 
IATELRDAPE 
YEPLTQLKNV 
PTKCPVPVCR 
DSCVPGDTVT 
MLMEFSLKDL 
RIPIRGDPHI 
ALEAGALVLG 
NPVGGHYNKA 
SSATVARMNS 
LSTEAARVLQ 
VEIMKYSMLG 
RQIAKELNIQ 



31 

! 

WREREHRPDL 
PLIEKIQAFE 
KTLACMGLAI 
RANYYGKYIA 
GRSFTALRSS 
ITGIVKVSNA 
YAIQEIQAEE 
LWGDPGLGK 
DQGICGIDEF 
KTVSENLKMG 
QDSNTSVLEV 
DFYLELRKQS 
TYSDEFGNLD 
VADFENFIGS 



41 
I 

SKTTGKRTSE 
KFFTRHIDLY 
HQVLTKDLER 
LRGTWRVSN 
PLTVTMDWQS 
EEGSRNKNDK 
NLFKLIVNSL 
SQMLQAACNV 
DKMGNQHQAL 
SALLSRFDLV 
VSEKPLSERL 
QRLNSSPITT 
FERSQHGSGM 
LNDQGYLLKK 



51 
I 

QTPQFLLSTK 
DKDE I ERKGS 
HAAELQAQEG 
I KPLCTKMAF 
IKIQELMSDD 
CMFLLYIEAN 
CPVIFGHELV 
APRGVYVCGN 
LEAMEQQSIS 
FILLDTPNEH 
KWPGETIDP 
RQLESLIRLT 
SNRSTAKRFI 
GPKVYQLQTM 



Seq ID NO: 45 DNA sequence 

Nucleic Acid Accession #: NM_005416.1 

Coding sequence: 149..658



ACCAGATCCC 
CTGAAGACCA 
AAAGAGTGTG 
CCCACCACCT 
AATATTTGTT 
AAAGATTCCA 
GCCAGGCTGT 
CAAGGTCCCT 
ACCAGGCAGC 
CAAAGTTCCT 
GCCATGTCCT 
TGGTGCACAG 
TGTTT CTGTG 
AGTCTCTCTC 
CTGAAGAATC 
GGCTGCTCAG 
CTCATTAAAT 



11 

! 

AGAGGCTGAA 
GAAAAGCCAC 
TCCACGATCC 
CAGCTTCAAC 
CCCACAACCA 
GAGCCAGGCT 
ACCAAGGTCC 
GAGCCAGGTT 
ATCAAGGTCC 
GAGCAAGGAT 
TCAACGGTCA 
ACAAGCCCTT 
TCTTAATTGT 
TTATTTGTAT 
CTGTAAGCCC 
GGTTCATCTG 
TGCTTTTAAT 



21 
I 

CACCTCGACC 
TAAGACTTTC 
TTTGAAGCAT 
AGCAGCAGGT 
AGGAGCCATG 
GTACCAAGGT 
CTGAGCCAGG 
GTACCAAGGT 
CTGACCAAGG 
ACACCAAAGT 
CTCCAGGCCC 
GAGAAGCCAA 
CTGTAGACCT 
CCTAAAAATA 
CTGAATTAAG 
AAGATTCGAA 
TCCA 



31 
I 

TTCTCTGCAC 
TGCTTAATTC 
GAGTT CTT AC 
GAAACAACCC 
CCACTCAAAG 
CCCTGAGCCA 
TTGTACCAAG 
CCCTGAGCCA 
CTTCATCAAG 
TCCTGTGCCA 
AGCTCAGCAG 
CCACCAGATG 
TGTAATCAGC 
CGTACTATAA 
CAGAAAGTCT 
TGAAAAGAAA 



41 
I 

AGCAGATGAT 
AGGAGCTTAG 
CAGCAGAAGC 
AGCCAGCCTC 
GTTCCACAAC 
GGCTGTACCA 
GTCCCTGAGC 
GGCTACACCA 
TTTCCTGAGC 
GGCTACACAA 
AAGACCAAGC 
CTGGACACCC 
ACATTGTCAC 
AGCTTTTGTT 
TCATGGCTTT 
TGCATGTTTC 



51 
I 

CCCTGAGCAG 
AGGATTCTTC 
AGACCTTTAC 
CACCTCAGGA 
CTGGAAACAC 
AGGTCCCTGA 
CAGGCTGTAC 
AGGTCCCTGA 
CAGGTGCCAT 
AGCTACCAGA 
AGAAGTAATT 
TCTTCCCATC 
CCCAAGCCAT 
CACACACACT 
TCTGGTCTTC 
CTGCTCTTCC 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 



Seq ID NO: 46 Protein sequence: 
Protein Accession #: NP_005407.1



1 11 21 31 41 51 

80 | | | | I I 

MSSYQQKQTF TPPPQLQQQQ VKQPSQPPPQ EIFVPTTKEP CHSKVPQPGN TKIPEPGCTK 
VPEPGCTKVP EPGCTKVPEP GCTKVPEPGC TKVPEPGCTK VPEPGYTKVP EPGSIKVPDQ 
GFIKFPEPGA IKVPEQGYTK VPVPGYTKLP EPCPSTVTPG PAQQKTKQK 

85 Seq ID NO: 47 DNA sequence 

Nucleic Acid Accession #: Eos sequence 



60 
120 



206 



WO 02/086443 

1 11 21 31 41 51

I i I I I I 

GCGTCGTGTG CAGGCGTCCC CGGGCTGTGG ATAATTAGAC ACGTTCTTCC CTCATTGCCC 

AAGGCTCGTT AGAATTCGCC CTAGAGCTGT ATCATGTATT TTCTTTCAAA TTAACTTTGC 

TTGCAATTAA GCTTAGGGAA CCAGCAACAA AAGCAAACTT GGCCCGAGGT CGTTCACCGC 

GAAAATGGAT TAGAGAAACT TCTTCCCCGA TTTAAGGGGA AAGATTCCTG CGGCCAGCGC 

TTTGGGGAAA GTGCCCCGAC CGCAGAGGCG ACGACAGGGG AGCAGGAAGC TGCTCACGGT 

AGT CGGCGTT GGCGGCAGCG GTGGCCTTCC TCATCTGGGC GATGTGGGCT CCTAGAAGAG 

TAAGGATAAC AT CCTGGAAA TGACTTCTGT ACGGTTTGAG CCCAACTGCA CACTCATGAC 

TTGGAGCTGC CCTGTGGAGT TACAGTTTAC CAAACACATT CATGAACATA ATCTCATTTA 

CTAAAAACTT TGTGAGAATT TTCTTTTACT AAAATTTTTT CTTATTACAA A 

Seq ID NO: 4 8 DNA sequence: 

Nucleic Acid Accession #: CAT cluster 



1 11 21 31 41 51 

I 1 I I I I 

TTCCAAATTT TTTTTTTTGT AATAAGAAAA AATTTTAGTA AAAGAAAATT CTCACAAAGT 

TTTTAGTAAA TGAGATTATG TTCATGAATG TGTTTGGTAA ACTGTAACTC CACAGGGCAG 

CTCCAAGTCA TGAGTGTGCA GTTGGGCTCA AACCGTACAG AAGTCATTTC CAGGATGTTA 

TCCTTACTCT TCTCGGAGCC CACATCGCCC AGATGAGGAA GGCCACCGCT GCCGCCAACG 

CCGACTACCG TGAGCAGCTT CCTGCTCCCC TGTCGTCGCC TCTGCGGTCG GGGCACTTTC 

CCCAAAGCGC TGGCCGCAGG AATCTTTCCC CTTAAATCGG GGAAGAAGTT TCTCTAATCC 

ATTTTCGCGG TGAACGACCT CGGGCCAAGT TTGCTTTTGT TGCTGGTTCC CTAAGCTTAA 

TTGCAAGCAA AGTTAATTTG AAAGAAAATA CATGATACAG CTCTAGGGCG AATTCTAACG 

AGCCTTGGGC AATGAGGGAA GAACGTGTCT AGTTATCCAC AGCCCGGGGA CGCCTGCACA 

CGACGCT 

Seq ID NO: 4 9 DNA sequence 

Nucleic Acid Accession #: CAT cluster 

1 11 21 31 41 51 

I ) I I I I 

TCTTTCTTCT GCTGCTCGTT TGTCTCTCCT GTGCTCTTCT TCTTTCTTTC CCTCGCCGCT 

CCTGCCGACC TCTGTTGTCT CTTCTCTGAT GGCGGGGGGC GGGAGAAGCT GACCGGTGAG 

ACCGTAGACC CGAAACCATT GGGTGT CACA AGCCGGTCGC CGGCTTTTTT GGGAGAACCC 

GACACATGCA GACCAGTTTT CCTGGAACNG CATGACCATG TTATTACTAT GGGCCGCCTC 

CCCAACCAAA GTGTTTAAAA CTTTTTAGGG CACCCCCAAA ATTTTTTTTT TTTTTTTTTT 

TTCATTTAAA AAACT CTAAT ATTTATATTA AATACAAAGA TACCCAAACC CTTTATGCTT 

CTTTCTCTGA TCTGTGTCTT TTTTCTTTGA CAGCATCTCG ATTTTTTTTC TGCTGCTTCA 

TCGCTGTAGC CATGGGAATC CGTTT CATTA TTATGGTAGC AATATGGAGT GCTGTATTCC 

TAAAGAAACT GACACAGGAG AATCACTTGA ACTTGGGAGG CAGAGTTTGC AGTGAGCCGA 

GATTGAACCA GTGCACTCCA GCCTTGGCAG CGGAGCAAGA TTCTGTCACA GTTCCTGAAG 

TGCTGGTATC GTCCTGCAGC CCCATCCTCG GTTCCATTGC GCTGCCAGGC AGGGTGCTGG 

GACGTGGGGA GAGCTGGTCT ATATATCCGG GTGAAGCTCA GCTGTGGCAC ACCTTGGATG 

CCGGGTCTCT CCTGGCCCCG GGGACCTAGT ATTTTTGCCA CGAGTGTACA CCAAACAAAG 

GAGACAGCAT CATTTATGAG CCTGCAGCAT CCACCCTACT GCTGTATCCA GTTTCCATTG 

ACTG 



Seq ID NO: 50 DNA sequence 
Nucleic Acid Accession #: L05187 
Coding sequence: 1991.. 2260 



1 11 21 31 41 51 

I I I I I I 

CTGCAGGGAG GCAGGTAGAA AAGGCTTTTG GGTTTTCAGG TGGGGGGCAG TCTAGCCTGA 

TCAGAAAGGA GGAAAAGGCC AGGGCAGATG TCTGGGTGGA GTGAAGGGAA AAAGTGATCC 

CAGAAGAAGG ATTAGCCCCT GAAAGTCCCT GAAGTAGGAG AAGGGTAAAG GTGTGGTTGG 

TGAAGGAAAG CAGGTTTTCC CAGATTAGCA ACCAGTCAGG GGGAGGAAGG TGAGAGTGGG 

AGAGTCATAA GTAAATTATT CTGAATGTGT GTAGTTTAAT GGAATTGGGA AAAAGATGGG 

GGAAATGGAT GGAAGGTCTT GGACTCTGAG ACAAGGGGTC TATAATCAGT CCATTTCATT 

ATTTCTAGCT TCCACCTTCA CCAAGGCAGA CAAGGAGGGC CCACCTCAGC TCCTCTGCTC 

CCCCTCCCTT TCCCACCTAT TCATGTGTGC AAGAGTGCCC TGTCCCACAG AACACGGGGA 

ACAACCATCT CAATGACAAG GACAGCAGGT GGCAAGGCTC AACAGGACTC AGATGTCCCC 

CCAGGGTTAA CTCATGAAAC CCTCCATGAA GCCTGCTGCT CACCCCTCCC TCAAGGCAAG 

CCCTGCACCT GGGT CTGAGG ATGAGGGTGG CAGTGAAAAT TAGGCCAGTG ACATCATTTT 

CAGCCAGCTA GTGCCAAAAA ATATCAGGTG GTGTTCATCA AATAAGCCGA GCCAACCGGT 

GATGAGGATG GTAGTGTGAG TCATGTGTGA CAGGTGAGGA ATGAAAACAG AGTGCCCGAG 

AGCTTCTATT TCCTTGAGGC AGGGCTCATT CATCTTATAA AAGCCAGCTG GCCATTGCCT 

TCACACCAAA CCCAAGGGAC CACACAGCCC ATTCTGCTCC GTATACCAGG TAAGTCTCTG 

ATTGCAACAA ACTGGCAATT CTAGTGTACT TTTTCATTAT TAGAAATTAG CTAAAGGCAA 

ATATGTGTAA GCAGGTTAAT CCAGGGTTTC AATGGGAGAT AGAGAATAGT GGAATATCTT 

TATTTTAAGT TAAATTACAG TCTGGATTTG AAAGGACCTT AGAGATGGTT AGGGCTCCCA 

CCTCAGTAGA TAGTCATTGA ACTGGGAGTC CTGGAGAAGA TTGTTCAAAT GCCCATGGGA 

AGTTCATAGC AGAACTAGAA CTCAGGCCAG AGCACTCTCA GTAACACTGC AATTTCCCCC 

TGACAAGATA TTTATAGAAA TTTTAATTTA TTAGATGGAT CTCTACTGAG CATTTATTCC 

ATTTAAGGCA GTATGCTAGG CACTTTGGAC AAAT CAATGC CCTAACGTAC TTACTTAACA 

AACATAAAAC CTAGCAGGAA GGTAATACAT ATATATAAAT AAATGAAATG CAAAGTAGAT 

AGTAATTGGC ATGACGGAGA TGGGCAGAGA AGGGCTGTGC ACTTTTGGGA GACTTGCTCA 

AGGAGACCTC TAGGGTGTCA AGTGATGTGA GCTATGATGG AGGGGTATTT GGACAAGCAG 

AGATGGGAAG AAAAG CAT T T GGAAGGGACT GTGTAAGCAC AGACCAGAAG CAAAACCATA 

GAGGCTTAGA TGAATATAAA GCCATCCTAT AAGTCACAGG CTTTCTACAT GGTACTAGGA 

GAGGAAAGTG GTCTGATGCC ATTTTCCAAA AGACCTAATA TGCGGACCTC ATGTCCCTCA 

GAAGCCAGCT TTAGTAGGGC ATTTTTCCAG AACAGATATA AGGTGCCTTG GGTAGGAAGG 

GAGCCAAGAA GAGAACTCCA ATAAAATGGA GCAGAAGAAA TTGCCTTTTA GCTCCTCCTC 

TTCAAAGGGC CTGAAAATTA TCCAAGCTTA TTTCATTTTT AAATGTAATG GGGGAGCTAA 



207 



10 



WO 02/086443 

GGGAGATGAA AGGCTTTCTC 
TTGTATCCAT CTTTCTTTAA 
CATTTGAAGC ATGAATTCTC 
GCAGCAGCAG GTGAAACAAC 
CAAGGAGCCC TGCCAACCCA 
CCAGCCCAAG ATTCCAGAGC 
CACTCCAGCA CCAGCCCAGC 
TTGAGGAGCT GGCCACTGGA 
GCCTATTGAC CCTGCAGTTA 
CTAAAAAGAT GTCCCTTACC 
GTCTCACTGA CTGAGCTAGT 
AGGT CAAGTG ACCATCCCTA 



PCT/US02/12476 



TTCTAAAGGG 
TTGAATCACT 
AGCAGCAGAA 
CTTGCCAGCC 
AGGTGCCTGA 
CCTGCCAGCC 
AGAAGACCAA 
TACTGAACAC 
GCATGCTGTC 
CTCATTCTGG 
CTTCTTGTTG 
G 



TCCTGAAATA 
GTGTCAGCTT 
GCAGCCTTGC 
TCCACCCCAG 
GCCCTGCCAC 
CAAGGTGCCT 
GCAGAAGTAA 
CCTACTCCAT 
ACCCTGAATC 
AGGCTCCTGA 
CTCGGGTGCA 



AAATCTGTTT 
TCTGTCTCTA 
ACCCCACCCC 
GAACCATGCA 
CCCAAAGTGC 
GAGCCCTGCC 
TGTGGTCCAC 
TCTGCTTATG 
ATAAT CGCTC 
GCCTCTGCGT 
TTTGAGGATG 



GGCATTGAAT 1920 

GAAAAAAACA 1980 

CTCAGCCTCA 2040 

TCCCCAAAAC 2100 

CTGAGCCCTG 2160 

CTTCAACGGT 2220 

AGCCATGCCC 2280 

AATCCCATTT 2340 

CTTTGCACCT 2400 

AAGGCTGAAC 2460 

GATTTGGGGA 252 0 



15 



Seq ID NO: 51 Protein sequence.* 
Protein Accession #:AAC26838 



20 



11 21 31 41 51 

I I I I I 

MNSQQQKQPC TPPPQPQQQQ VKQPCQPPPQ EPCIPKTKEP CQPKVPEPCH PKVPEPCQPK 

IPEPCQPKVP EPCPSTVTPA PAQQKTKQK 



60 



25 



Seq ID NO: 52 DNA sequence 

Nucleic Acid Accession #: NM_002638.1 

Coding sequence: 12 0-473 



11 



21 



31 



41 



51 



30 



35 



40 



45 



CAATACAGCT 
GCTGGACTGC 
TGAGGGCCAG 
AGGCAGCTGT 
TCAATGGACA 
CGCAAGAGCC 
TCCGGTGCGC 
TCAAGAAGTG 
CGGTCCTTGC 
TGCTGCCCTT 
GAGCTGCCTC 



AAGGAATTAT 
ATAAAGATTG 
CAGCTTCTTG 
CACGGGAGTT 
AGATCCCGTT 
AGT CAAAGGT 
CATGTTGAAT 
CTGTGAAGGC 
TGCACCTGTG 
CCCCTTCCCA 
TCTCATCCAC 



CCCTTGTAAA 
GTATGGCCTT 
ATCGTGGTGG 
CCTGTTAAAG 
AAAGGACAAG 
CCAGTCTCCA 
CCCCCTAACC 
TCTTGCGGGA 
CCGTCCCCAG 
CACTGTCCAT 
TTT CCAATAA 



TACCACAGAC 
AGCTCTTAGC 
TGTTCCTCAT 
GTCAAGACAC 
TTTCAGTTAA 
CTAAGCCTGG 
GCTGCTTGAA 
TGGCCTGTTT 
AGCTACAGGC 
TCTTCCTCCC 
A 



CCGCCCTGGA 
CAAACACCTT 
CGCTGGGACG 
TGTCAAAGGC 
AGGTCAAGAT 
CTCCTGCCCC 
AGATACTGAC 
CGTTCCCCAG 
CCCATCTGGT 
ATTCAGGATG 



GCCAGGCCAA 
CCTGACAGCA 
CTGGTTCTAG 
CGTGTTCCAT 
AAAGT C AAAG 
ATTATCTTGA 
TGCCCAGGAA 
TGAAGGGAGC 
CCTAAGTCCC 
CCCACGGCTG 



Seq ID NO: 53 Protein sequence: 
Protein Accession #: NP_002629.1 

1 11 21 31 41 51 

I I I I I I 

MRASSFLIW VFLIAGTLVL eaavtgvpvk GQDTVKGRVP FNGQDPVKGQ VSVKGQDKVK 
AQEPVKGPVS TKPGSCPIID IRCAMLNPPN RCLKDTDCPG IKKCCEGSCG MACFVPQ 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 



60 



50 



55 



60 



65 



70 



75 



80 



85 



Seq ID NO: 54 DNA sequence 

Nucleic Acid Accession #: NM_019618 

Coding sequence: 75-584 



GGCACGAGCC 
GAGACAACCA 
ATCAAT CAAT 
CCCTTCAGGG 
TTGCTGTTAT 
ATT TGGGAAT 
CATTGCAGCT 
CCTTCCTTTT 
CGGACTGGTT 
GGAAGTCATA 
GCAGCTTGGT 
AGTGTCATTT 
TAATGAAGAA 
GGAGAGCTGG 
CTGCATGAGT 
TGAAGATGCT 
CTCTGTTTCT 
CCAATATACC 
TAATTCTTGT 
AATAAACTTT 



11 

I 

ACGATTCAGT 
CACTATGAGA 
GTGTAAACCT 
TCAGAACCTT 
CACATGCAAG 
CCAGAAT CCA 
AAAAG AG C AG 
CTACCGTGCC 
CATTGCCTCC 
CAACACTGCC 
CTTTGTCTTA 
TCACGCTGGT 
GAAGCAATTA 
GTGGTATAAG 
GACTTTAAGA 
TCAGAGCTCA 
GTTTTGCTTT 
TCATTGTGTG 
GTTAAGTTAA 
GTGTATTTAT 



21 
I 

CCCCTGGACT 
GGCACTCCAG 
ATTACTGGGA 
GTGGCAGTTC 
TATCCAGAGG 
GAAATGTGTT 
AAGATCATGG 
AAGACTGGTA 
TCCAAGAGAG 
TTTGAATTAA 
AAGTTTCTGG 
GCTGAGACAG 
CTTCATAGCA 
GCTGTCCTCT 
CTCAAAGACC 
TGCGCGTTAC 
ATTCCCTCTT 
TAATAGAACC 
ATCATTTTTG 
ATAATAAAAA 



31 



GTAGATAAAG 
GAGACGCTGA 
CTATTAATGA 
CACGAAGTGA 
CTCTTGAGCA 
TGTATTGTGA 
ATCTGTATGG 
GGACCTCCAC 
ACCAGCCCAT 
ATATAAATGA 
TTCCCAATGT 
GGGCAAGGCT 
ACTGAAGAAC 
CAAGCTGGTG 
AAACACTGAG 
CCACGATGGC 
GGGATGATAT 
TTCTTAGCAT 
TCCTAATTGT 
AAAAAAAAAA 



41 
I 

ACCCTTTCTT 
TGGTGGAGGA 
TTTGAATCAG 
CAGTGTGACC 
AGGCAGAGGG 
GAAGGTTGGA 
CCAACCCGAG 
CCTTGAGTCT 
CATTCTGACT 
CTGAACT CAG 
GTTTTCGTCT 
GCTGTTATCA 
AGGATGTGGC 
CTGTGTAGGC 
CTTTCTTCTA 
ATGACTAGCA 
CATCCAGTCT 
TAAGACCTTG 
AATGTGTAAT 
AAA 



51 



GCCAGGTGCT 
AGGGCCGTCT 
CAAGTGTGGA 
CCAGTCACTG 
GATCCCATTT 
GAACAGCCCA 
CCCGTGAAAC 
GTGGCCTTCC 
TCAGAACTTG 
CCTAGAGGTG 
ACATTTTCTT 
TCTCATTTTA 
CTCAGAAGCA 
CACAAGGCAT 
GGGGTGGGTA 
CAGAGCTGAT 
TTATATGTTG 
TAAACAAAAA 
CTTAAAGTTA 



Seq ID NO: 55 Protein sequence: 
Protein Accession #: NP_062564 



1 
I 



11 



31 



41 



51 



21 

I I I I I 

MRGTPGDADG GGRAVYQSMC KPITGTINDL NQQVWTLQGQ NLVAVPRSDS VTPVTVAVIT 
CKYPEALEQG RGDPIYLGIQ NPEMCDYCEK VGEQPTLQLK EQKIMDLYGQ PEPVKPFLFY 
RAKTGRTSTL ESVAFPDWFI ASSKRDQPII LTSELGKSYN TAFELNIND 



Seq ID NO: 56 DNA sequence 

Nucleic Acid Accession #: NM_003125 

Coding sequence: 65-334 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 



60 
120 



208 



WO 02/086443 



PCT/US02/12476 



1 11 21 31 41 51 

I I 1 I 1 I 

AGCAGTTCTA AGGGACCATA CAGAGTATTC CTCTCTTCAC ACCAGGACCA GCCACTGTTG 60 

5 CAGCATGAGT TCCCAGCAGC AGAAGCAGCC CTGCATCCCA CCCCCTCAGC TTCAGCAGCA 120 

GCAGGTGAAA CAGCCTTGCC AGCCTCCACC TCAGGAACCA TGCATCCCCA AAACCAAGGA 180 
GCCCTGCCAC CCCAAGGTGC CTGAGCCCTG CCACCCCAAA GTGCCTGAGC CCTGCCAGCC ' 240 

CAAGCTTCCA GAGCCATGCC ACCCCAAGGT GCCTGAGCCC TGCCCTTCAA TAGTCACTCC 3 00 

AGCACCAGCC CAGCAGAAGA CCAAGCAGAA GTAATGTGGT CCACAGCCAT GCCCTTGAGG 3 60 

10 AGCCGGCCAC CAGATGCTGA ATCCCCTATC CCATTCTGTG TATGAGTCCC ATTTGCCTTG 420 

CAATTAGCAT TCTGTCTCCC CCAAAAAAGA ATGTGCTATG AAGCTTTCTT TCCTACACAC 480 

TCTGAGTCTC TGAATGAAGC TGAAGGTCTT AGTACCAGAG CTAGTTTTCA GCTGCTCAGA 540 

ATTCATCTGA AGAGAGACTT AAGATGAAAG CAAATGATTC AGCTCCCTTA TACCCCCATT 60 0 
AAATTCACTT TCAATTCCA 



Seq ID NO: 57 Protein sequence: 
Protein Accession #: NP 003116 

20 

1 11 21 31 41 51 

I I I 1 I I 

MSSQQQKQPC IPPPQLQQQQ VKQPCQPPPQ EPCIPKTKEP CHPKVPEPCH PKVPEPCQPK 60 
LPEPCHPKVP EPCPSIVTPA PAQQKTKQK 

25 

Seq ID NO: 58 DNA sequence 

Nucleic Acid Accession ft: NM_001793.2 

Coding sequence: 71-2560 

30 1 11 21 31 41 51 

I I I 1 I I 

AAAGGGGCAA GAGCTGAGCG GAACACCGGC CCGCCGTCGC GGCAGCTGCT TCACCCCTCT 60 

CTCTGCAGCC ATGGGGCTCC CTCGTGGACC TCTCGCGTCT CTCCTCCTTC TCCAGGTTTG 120 

CTGGCTGCAG TGCGCGGCCT CCGAGCCGTG CCGGGCGGTC TT CAGGGAGG CTGAAGTGAC 180 

35 CTTGGAGGCG GGAGGCGCGG AGCAGGAGCC CGGCCAGGCG CTGGGGAAAG TATT CATGGG 240 

CTGCCCTGGG CAAGAGCCAG CTCTGTTTAG CACTGATAAT GATGACTTCA CTGTGCGGAA 300 

TGGCGAGACA GTCCAGGAAA GAAGGTCACT GAAGGAAAGG AATCCATTGA AGATCTTCCC 3 60 

ATCCAAACGT ATCTTACGAA GACACAAGAG AGATTGGGTG GTTGCTCCAA TATCTGTCCC 420 

TGAAAATGGC AAGGGTCCCT TCCCCCAGAG ACTGAAT CAG CTCAAGTCTA ATAAAGATAG 480 

40 AGACACCAAG ATTTTCTACA GCAT C ACGGG GCCGGGGGCA GACAGCCCCC CTGAGGGTGT 540 

CTTCGCTGTA GAGAAGGAGA CAGGCTGGTT GTTGTTGAAT AAGCCACTGG ACCGGGAGGA 600 

GATTGCCAAG TATGAGCTCT TTGGCCACGC TGTGTCAGAG AATGGTGCCT CAGTGGAGGA 660 

CCCCATGAAC AT CTCCAT CA TCGTGACCGA CCAGAATGAC CACAAGCCCA AGTTTACCCA 720 

GGACACCTTC CGAGGGAGTG TCTTAGAGGG AGTCCTACCA GGTACTTCTG TGATGCAGGT 780 

45 GACAGCCACG GATGAGGATG ATG CCATCTA CACCTACAAT GGGGTGGTTG CTTACTCCAT 840 

CCATAGCCAA GAACCAAAGG ACCCACACGA CCTCATGTTC ACCATTCACC GGAGCACAGG 900 

CACCATCAGC GTCATCTCCA GTGGCCTGGA CCGGGAAAAA GTCCCTGAGT ACACACTGAC 960 

CATCCAGGCC ACAGACATGG ATGGGGACGG CTCCACCACC ACGGCAGTGG CAGTAGTGGA 1020 

GATCCTTGAT GCCAATGACA ATG CTCCCAT GTTTGACCCC CAGAAGTACG AGGCCCATGT 10 80 

50 GCCTGAGAAT GCAGTGGGCC ATGAGGTGCA GAGGCTGACG GTCACTGATC TGGACGCCCC 1140 

CAACTCACCA GCGTGGCGTG CCACCTACCT TATCATGGGC GGTGACGACG GGGACCATTT 12 00 

TACCATCACC ACCCACCCTG AGAGCAACCA GGGCATCCTG ACAACCAGGA AGGGTTTGGA 1260 

TTTTGAGGCC AAAAACCAGC ACACCCTGTA CGTTGAAGTG ACCAACGAGG CCCCTTTTGT 1320 

GCTGAAGCTC CCAACCTCCA CAGCCACCAT AGTGGTCCAC GTGGAGGATG TGAATGAGGC 1380 

55 ACCTGTGTTT GTCCCACCCT CCAAAGTCGT TGAGGTCCAG GAGGGCATCC CCACTGGGGA 1440 

GCCTGTGTGT GTCTACACTG CAGAAGACCC T G AC AAGG AG AATCAAAAGA TCAGCTACCG 1500 

CATCCTGAGA GACCCAGCAG GGTGGCTAGC CATGGACCCA GACAGTGGGC AGGTCACAGC 1560 

TGTGGGCACC CTCGACCGTG AGGATGAGCA GTTTGTGAGG AACAACATCT ATGAAGTCAT 1620 

GGTCTTGGCC ATGGACAATG GAAGCCCTCC CACCACTGGC ACGGGAACCC TTCTGCTAAC 1680 

60 ACTGATTGAT GTCAATGACC ATGGCCCAGT GCCTGAGCCC CGT CAGATCA CCATCTGCAA 1740 

CCAAAGCCCT GTGCGCCAGG TGCTGAACAT CACGGACAAG GACCTGTCTC CCCACACCTC 1800 

CCCTTTCCAG GCCCAGCTCA CAGATGACTC AGACAT CT AC TGGACGGCAG AGGTCAACGA 18 60 

GGAAGGTGAC ACAGTGGT CT TGTCCCTGAA GAAGTTCCTG AAGCAGGATA CATATGACGT 192 0 

GCACCTTTCT CTGTCTGACC ATGGCAACAA AGAGCAGCTG ACGGTGATCA GGGCCACTGT 1980 

65 GTGCGACTGC CATGGCCATG TCGAAACCTG CCCTGGACCC TGGAAGGGAG GTTTCATCCT 2040 

CCCTGTGCTG GGGGCTGTCC TGGCTCTGCT GTTCCTCCTG CTGGTGCTGC TTTTGTTGGT 2100 

GAGAAAGAAG CGGAAGATCA AGGAGCCCCT CCTACTCCCA GAAGATGACA CCCGTGACAA 2160 

CGTCTTCTAC TATGGCGAAG AGGGGGGTGG CGAAGAGGAC CAGGACTATG ACATCACCCA 222 0 

GCTCCACCGA GGTCTGGAGG CCAGGCCGGA GGTGGTTCTC CGCAATGACG TGGCACCAAC 22 80 

70 CATCATCCCG ACACCCATGT ACCGTCCTCG GCCAGCCAAC CCAGATGAAA TCGGCAACTT 2340 

TATAATTGAG AACCTGAAGG CGGCTAACAC AGACCCCACA GCCCCGCCCT ACGACACCCT 2400 

CTTGGTGTTC GACTATGAGG GCAGCGGCTC CGACGCCGCG TCCCTGAGCT CCCTCACCTC 2460 

CTCCGCCTCC GACCAAGACC AAGATTACGA TTATCTGAAC GAGTGGGGCA GCCGCTTCAA 2520 

GAAGCTGGCA GACATGTACG GTGGCGGGGA GGACGACTAG GCGGCCTGCC TGCAGGGCTG 2 580 

75 GGGACCAAAC GTCAGGCCAC AGAGCATCTC CAAGGGGTCT CAGTTCCCCC TTCAGCTGAG 2 640 

GACTTCGGAG CTTGTCAGGA AGTGGCCGTA GCAACTTGGC GGAGACAGGC TATGAGTCTG 2700 

ACGTTAGAGT GGTTGCTTCC TTAGCCTTTC AGGATGGAGG AATGTGGGCA GTTTGACTTC 2760 

AGCACTGAAA ACCTCTCCAC CTGGGCCAGG GTTGCCTCAG AGGCCAAGTT TCCAGAAGCC 2 82 0 

TCTTACCTGC CGTAAAATGC TCAACCCTGT GTCCTGGGCC TGGGCCTGCT GTGACTGACC 2880 

80 TACAGTGGAC TTTCTCTCTG GAATGGAACC TTCTTAGGCC TCCTGGTGCA ACTTAATTTT 2 940 

TTTTTTTAAT GCTATCTTCA AAACGTTAGA GAAAGTTCTT CAAAAGTGCA GCCCAGAGCT 3000 

GCTGGGCCCA CTGGCCGTCC TGCATTTCTG GTTTCCAGAC CCCAATGCCT CCCATTCGGA 3060 

TGGATCTCTG CGTTTTTATA CTGAGTGTGC CTAGGTTGCC CCTTATTTTT TATTTTCCCT 3120 

GTTGCGTTGC TATAGATGAA GGGTGAGGAC AATCGTGTAT ATGTACTAGA ACTTTTTTAT 3180 

85 TAAAGAAACT TTTCCCAGAA AAAAA 

Seq ID NO: 59 Protein sequence: 



209 



WO 02/086443 

Protein Accession #: NP 0 01784.2 



PCT/US02/12476 



11 21 31 41 51 

III!! 

MGLPRGPLAS LLLLQVCWLQ CAASEPCRAV FREAEVTLEA GGAEQEPGQA LGKVFMGCPG 60 

QEPALFSTDN DD FT VRNGET VQERRSLKER NPLKIFPSKR I LRRHKRDWV VAPISVPENG 120 

KGPFPQRLNQ LKSNKDRDTK IFYSITGPGA DSPPEGVFAV EKETGWLkLN KPLDREEIAK 180 

YELFGHAVSE NGASVEDPMN ISIIVTDQND HKPKFTQDTF RGSVLEGVIjP GTSVMQVTAT 240 

DEDDAIYTYN GWAYSIHSQ EPKDPHDLMF TIHRSTGTIS VISSGLDREK VPEYTLTIQA 300 

10 TDMDGDGSTT TAVAWEILD ANDNAPMFDP QKYEAHVPEN AVGHEVQRLT VTDLDAPNSP 360 

AWRATYL I MG GDDGDHFTIT THPESNQGIL TTRKGLDFEA KNQHTLYVEV TNEAPFVLKL 420 

PTSTATIWH VEDVNEAPVF VPPSKWEVQ EGIPTGEPVC VYTAEDPDKE NQKISYRILR 480 

DPAGWLAMDP DSGQVTAVGT LDREDEQ FVR NN I YEVMVLA MDNGSPPTTG TGTLLLTLID 540 

VNDHGPVPEP RQITICNQSP VRQVLN1 TDK DkSPHTSPFQ AQLTDDSDIY WTAEVNEEGD 60 0 

15 TWIiSLKKFL KQDTYDVHLS LSDHGNKEQL TVIRATVCDC HGHVETCPGP WKGGFILPVL 660 

GAVLALLFLL LVLLLLVRKK RKIKEPLLLP EDDTRDNVFY YGEEGGGEED QDYDITQLHR 72 0 

GLEARPEWL RNDVAPTIIP TPMYRPRPAN PDEIGNFIIE NLKAANTDPT APPYDTIiLVF 7 80 
DYEGSGSDAA SLSSLTSSAS DQDQDYDYLN EWGSRFKKLA DMYGGGEDD 

20 Seq ID NO: 60 DNA sequence 

Nucleic Acid Accession #: Eos sequence 
Coding sequence: 162-42 8 

_ 1 11 21 31 41 51 

25 | 1 l I ! I 

GCGTTCCGTT GGCGGCGGAT TCGAACGTTC GGACTGAGGT TTTTCTGCCT GAAGAAGCGT 60 

CATACGGACC GGATTGTTTT CGCTGGCCCA GTGTCCCCGG AGCTTGTGTG CGATACAGAG 12 0 

AGCACCT CGG AAGCTGAGGC AGCTGGTACT TGACAGAGAG GATGGCGCTG T CGACCAT AG 180 

TCTCCCAGAG GAAGCAGATA AAGCGGAAGG CTCCCCGTGG CTTTCTAAAG CGAGTCTTCA 240 

30 AGCGAAAGAA GCCTCAACTT CGTCTGGAGA AAAGTGGTGA CTTATTGGTC CATCTGAACT 300 

GTTTACTGTT TGT T CAT CGA TTAGCAGAAG AGTCCAGGAC AAACGCTTGT GCGAGTAAAT 360 

GTAGAGTCAT TAACAAGGAG CATGTACTGG CCGCAGCAAA GGTAATTCTA AAGAAGAGCA 420 

GAGGTTAGAA GTCAAAGAAC ATATTCTTGA AAGTTATGAT GCATTCTTTT GGGTGGTAAC 480 
AG AT CAT AAA GACATTTTTT ACACAT C AGT TAATATGGGA TTATTAAATA TTGG 
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Seq ID NO: 61 Protein sequence: 
Protein Accession #: Eos sequence 



1 11 21 31 41 51 

40 | | j | | | 

MALSTIVSQR KQIKRKAPRG FLKRVFKRKK PQLRLEKSGD LLVHLNCLLF VHRLAEESRT 60 
NACASKCRVI NKEHVLAAAK VILKKSRG 

Seq ID NO: 62 DNA sequence 
45 Nucleic Acid Accession #: NM_000094.2 
Coding sequence: 99-8933 

1 11 21 31 41 51 

<n 1 1 1 1 1 1 

Z>\J GGGCTGGAGG GGCGCTGGGC TCGGACCTGC CAAGGCCACC GCAGGGGGGA GCAAGGGACA 60 

GAGGCGGGGG TCCTAGCTGA CGGCTTTTAC TGCCTAGGAT GACGCTGCGG CTTCTGGTGG 120 
CCGCGCTCTG CGCCGGGATC CTGGCAGAGG CGCCCCGAGT GCGAGCCCAG CACAGGGAGA 180 
GAGTGACCTG CACGCGCCTT TACGCCGCTG ACATTGTGTT CTTACTGGAT GGCTCCTCAT 240 
CCATTGGCCG CAGCAATTTC CGCGAGGTCC GCAGCTTTCT CGAAGGGCTG GTGCTGCCTT 300 

55 TCTCTGGAGC AGCCAGTGCA CAGGGTGTGC GCTTTGCCAC AGTGCAGTAC AGCGATGACC 360 

CACGGACAGA GTTCGGCCTG GATGCACTTG GCTCTGGGGG TGATGTGATC CGCGCCATCC 420 
GTGAGCTTAG CTACAAGGGG GGCAACACTC GCACAGGGGC TGCAATTCTC CATGTGGCTG 480 
ACCATGTCTT CCTGCCCCAG CTGGCCCGAC CTGGTGTCCC CAAGGTCTGC ATCCTGATCA 540 
CAGACGGGAA GTCCCAGGAC CTGGTGGACA CAGCTGCCCA AAGGCTGAAG GGGCAGGGGG 600 

60 TCAAGCTATT TGCTGTGGGG AT CAAGAATG CTGACCCTGA GGAGCTGAAG CGAGTTGCCT 660 

CACAGCCAAC CTCCGACTTC TTCTTCTTCG TCAATGACTT CAGCATCTTG AGGACACTAC 720 
TGCCCCTCGT TTCCCGGAGA GTGTGCACGA CTGCTGGTGG CGTGCCTGTG ACCCGACCTC 780 
CGGATGACTC GACCTCTGCT CCACGAGACC TGGTGCTGTC TGAGCCAAGC AGCCAATCCT 840 
TGAGAGTACA GTGGACAGCG GCCAGTGGCC CTGTGACTGG CTACAAGGTC CAGTACACTC 900 

65 CTCTGACGGG GCTGGGACAG CCACTGCCGA GTGAGCGGCA GGAGGTGAAC GTCCCAGCTG 960 

GTGAGACCAG TGTGCGGCTG CGGGGTCTCC GGCCACTGAC CGAGTACCAA GTGACTGTGA 102 0 

TTGCCCTCTA CGCCAACAGC AT CGGGGAGG CTGTGAGCGG GACAGCTCGG ACCACTGCCC 1080 

TAGAAGGGCC GGAACTGACC ATCCAGAATA CCACAGCCCA CAGCCTCCTG GTGGCCTGGC 1140 

GGAGTGTGCC AGGTGCCACT GGCTACCGTG TGACATGGCG GGTCCTCAGT GGTGGGCCCA 12 00 

70 CACAGCAGCA GGAGCTGGGC CCTGGGCAGG GTTCAGTGTT GCTGCGTGAC TTGGAGCCTG 12 60 

GCACGGACTA TGAGGTGACC GTGAGCACCC TATTTGGCCG CAGTGTGGGG CCCGCCACTT 132 0 

CCCTGATGGC TCGCACTGAC GCTTCTGTTG AGCAGACCCT GCGCCCGGTC ATCCTGGGCC 13 80 

CCACATCCAT CCTCCTTTCC TGGAACTTGG TGCCTGAGGC CCGTGGCTAC CGGTTGGAAT 1440 

GGCGGCGTGA GACTGGCTTG GAGCCACCGC AGAAGGTGGT ACTGCCCTCT GATGTGACCC 150 0 

75 GCTACCAGTT GGATGGGCTG CAGCCGGGCA CTGAGTACCG CCTCACACTC TACACTCTGC 1560 

TGGAGGGCCA CGAGGTGGCC ACCCCTGCAA CCGTGGTTCC CACTGGACCA GAGCTGCCTG 1620 

TGAGCCCTGT AACAGACCTG CAAGCCACCG AGCTGCCCGG GCAGCGGGTG CGAGTGTCCT 1680 

GGAGCCCAGT CCCTGGTGCC ACCCAGTACC GCAT CATTGT GCGCAGCACC CAGGGGGTTG 1740 

AGCGGACCCT GGTGCTTCCT GGGAGTCAGA CAGCATTCGA CTTGGATGAC GTTCAGGCTG 1800 

80 GGCTTAGCTA CACTGTGCGG GTGTCTGCTC GAGTGGGTCC CCGTGAGGGC AGTGCCAGTG 1860 

TCCTCACTGT CCGCCGGGAG CCGGAAACTC CACTTGCTGT TCCAGGGCTG CGGGTTGTGG 192 0 

TGTCAGATGC AACGCGAGTG AGGGTGGCCT GGGGACCCGT CCCTGGAGCC AGTGGATTTC 1980 

GGATTAGCTG GAGCACAGGC AGTGGTCCGG AGTCCAGCCA GACACTGCCC CCAGACTCTA 2 040 

CTGCCACAGA CATCACAGGG CTGCAGCCTG GAACCACCTA CCAGGTGGCT GTGTCGGTAC 2100 

85 TGCGAGGCAG AGAGGAGGGC CCTGCTGCAG TCATCGTGGC TCGAACGGAC CCACTGGGCC 2160 

CAGTGAGGAC GGTCCATGTG ACTCAGGCCA GCAGCTCATC TGTCACCATT ACCTGGACCA 2220 

GGGTTCCTGG CGCCACAGGA TACAGGGTTT CCTGGCACTC AGCCCACGGC CCAGAGAAAT 2280 
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CCCAGTTGGT TTCTGGGGAG GCCACGGTGG 
AGTATACGGT GCATGTGAGG GCCCATGTGG 
TTGTGAGGAC TGCCCCTGAG CCTGTGGGTC 
CCAGCGACGT TCTACGGATC ACCTGGGTAG 
5 CCTGGGGCCG GAGTGAAGGC GGCCCCATGA 

CTGCAGAGAT CCGGGGTCTC GAAGGTGGAG 
TCGGGGACCG CGAGGGCACA CCTGTCTCCA 
CAGCCCTGGG GACGCTTCAC GTGGTGCAGC 
AGCCGGTGCC CAGAGCG CAG GGCTTCCTTC 

10 AGTCCCGGGT CCTGGGGCCG GAGCTCAGCA 

CACAGTACCG CGTGAGGCTG AGTGTCCTAG 
TGACTGCGCG CACTGAGT CA CCTCGTGTTC 
CGAT CGACTC GGTGACTTTG GCCTGGACTC 
CCTGGCGGCC ACTCAGAGGC CCTGGCCAGG 

15 GGATCTCAAG CTCCCAGCGG GTGACAGGGC 

TGACGCCTGT CCTGGATGGT GTGCGGGGTC 
GCCCCCGTGG CCTGGCGGAT GTGGTGTTCC 
GTGCGGAGGC TACGAGGAGG GTCCTGGAGC 
CACAGGCAGT TCAGGTTGGC CTGCTGTCTT 

20 TGAATGGCTC CCATGACCTT GGCATTATCT 

ACCCAAGTGG GAACAACCTG GGCACAGCCG 
CAGATGCTCC TGGGCGCCGC CAGCACGTAC 
CCTTGAGAGG TGACATATTC AGCCCCATCC 
TGATGTTGGG AATGGCTGGA GCGGACCCAG 

25 ACTCTGTCCA GACCTTCTTC GCCGTGGATG 

GTCTGGCCAC AGCCCTGTGT CAGGCATCCT 
CAGTGTATTG TCCAAAGGGC CAGAAGGGGG 
TTGGGCCTCC TGGCGACCCT GGCCTCCCGG 
CCCCTGGAAG TGCCACTGCC AAGGGCGAGA 

30 GCAGCCCTGG CCGCGCCGGG AATCCTGGGA 

CAGGGTTGCC TGGCCCTCGT GGGGACCCGG 
AGCCGGGGGC TCCCGGACAA GT CAT CGG AG 
GGGACCCTGG ACCAT CGGGC CCCCCTGGAC 
GTGGCCCCCC AGGGCTTCCT GGAACAGCCA 

35 GGGGTCCCCC TGG AC CAGGT GAAGGTGGCA 

TTCCCGGAAG CCCTGGACCC CAAGGCCCCG 
GTGACTCTGA GGATGGAGCT CCAGGCCTCC 
GCCCACGGGG ACCTCCTGGA GCTATTGGCC 
TGGGTGAGGC TGGAGAGAAG GGCGAACGTG 

40 TGCCAGGGGT TGCTGGACGT CCTGGAGCCA 

GCCGCCAAGG AGAGAAGGGG GAGCCTGGTC 
CTGTTGCTGG ACCCAAAGGA GAAAAGGGAG 
CCGGAGTCCA AGGGGAACGG GGCCCACCCG 
AGGGAGACCC TGGAGACCGG GGTCCCATTG 

45 ACTCAGGGCC TCCTGGAGAG AAGGGAGACC 

GCCCCCGAGG ACGAGATGGT GAAGTTGGAG 
CGGGTTTGCC TGGAAAAG CA GGCGAGCGTG 
CTGTGGGTGA AAAGGGAGAC CAGGGAGATC 
GAT CAT CTGG ACCCAAGGGT GACCGTGGGG 

50 TGGTAGACAC AGGACCTGGA GCCAGAGAGA 

GTCCTCGAGG GCCCAAGGGT GATCCTGGCC 
AAGGGTTTCG GGGACCCCCA GGCCCACAGG 
AAAAGGGTGA CCGGGGTCCC CCTGGGCTGG 
GAGCCGCTGG GCCCTCTGGG CCGAATGGTG 

55 ACGGGCTTCC AGGCCTCCGT GGAGAACAAG 

TACCGGGAAA GCCAGGCGAG GATGGGAAAC 
GGGACCCTGG AGAAGACGGG AGGAAGGGAG 
AAGGTCGTGA TGGCCCCAAG GGTGAGCGTG 
CTCCAGGCCT CCCAGGGCCA GTGGGCCCTC 

60 GCACGGGCCC CAAGGGTGAC CGTGGGGAGA 

GAGAGCGTGG CCTGCGAGGA GAGCCTGGAA 
CTGCTGGCAT CAAGGCATCT GCCCTGCGGG 
GTAGCTTCCT GCCTGTGCCC GAACGGCGTC 
GCCCCCCAGG CAAGGAGGGC CCCATCGGCT 

65 GTGGAGACCC TGGCCCTCAG GGGCCACCTG 

GGCCTTCCGG CCTTGCCGGG GAGCCTGGAA 
CTGGGGGTGT GGGAGAGGCA GGAAGGCCAG 
AACG TGG AG A ACAGGGCAGA GATGGCCCTC 
GACCCCCTGG CCCCAAGGTG TCTGTGGATG 

70 GACCCCCTGG ACTCAAGGGT GCTAAGGGGG 
AAGGAGACAG GGGTGTGCCA GGCATCAAAG 
AGGACGGCAA CCCGGGTCTA CCAGGAGAGC 
GTCTGCAGGG TCCAAGAGGC CCCCCTGGCC 
CTGGTGCCCC GGGTCTTGCT GGCCCTGCAG 

75 AGCCTGGAGA GACAGGACCT CCAGGACGGG 

TTCCTGGACC CCCCGGCCCT TCAGGCCTTG 
GACAAGTGGG GGAGACAGGG AAGCCGGGAG 
ATGGAGACAG AGGGAGCCCT GGTGTGCCAG 
CTAAAGGAGA ACCTGGCCCC ACGGGGGCCC 

80 CAAAGGGAGA GAAGGGAGCC CCTGGAGGCC 

CCAAAGGTGA CCGAGGACTG CCAGGGCCGC 
GGGAGCCCGG AGACCCTGGG GAAGATGGTC 
AGGGTGACCC AGGAGT CGGG GTCCCGGGCT 
AGGGAGATCT GGGCCTCCCT GGCCTGCCCG 

85 AGACAGGCCC TCGAGGAGAG ATGGGTCAGC 

GCCCCCCAGG GAGAGAAGGA ATCCCAGGAC 
TGGGACCACC TQGGGCCTCT GGACTCAAAG 



CTGAGCTGGA TGGACTGGAG CCAGATACTG 2340 

CTGGCGTGGA TGGGCCCCCT GCCTCTGTGG 2400 

GTGTGTCGAG GCTGCAGATC CTCAATGCTT 2460 

GGGTCACTGG AGCCACAGCT TACAGACTGG 2520 

GGCACCAGAT ACTCCCAGGA AACACAGACT 2580 

TCAGCTACTC AGTGCGAGTG ACTGCACTTG 2640 

TTGTTGTCAC TACGCCGCCT GAGGCTCCGC 2700 

GCGGGGAGCA CTCGCTGAGG CTGCGCTGGG 2760 

TGCACTGGCA ACCTGAGGGT GGCCAGGAAC 2820 

GCTATCACCT GGACGGGCTG GAGCCAGCGA 2880 

GGCCGGCTGG AGAAGGGCCC TCTGCAGAGG 2940 

CAAGCATTGA ACTACGTGTG GTGGACACCT 3000 

CAGTGTCCAG GGCATCCAGC TACATCCTAT 3060 

AAGTGCCTGG GTCCCCGCAG ACACTTCCAG 3120 

TAGAGCCTGG CGTCTCT TAG ATCTTCTCCC 3180 

CTGAGGCATC TGT CACACAG ACGCCAGTGT 3240 

TACCACATGC CACTCAAGAC AATGCTCACC 3300 

GTCTGGTGTT GGCACTTGGG CCTCTTGGGC 3360 

ACAGTCATCG GCCCTCCCCA CTGTTCCCAC 342 0 

TGCAAAGGAT CCGTGACATG CCCTACATGG 3480 

TGGTCACAGC TCACAGATAC ATGTTGGCAC 3540 

CAGGGGTGAT GGTTCTGCTA GTGGATGAAC 360 0 

GTGAGGCCCA GGCTTCTGGG CTTAATGTGG 3 660 

AGCAGCTGCG TCGCTTGGCG CCGGGTATGG 372 0 

ATGGGCCAAG CCTGGACCAG GCAGTCAGTG 3780 

TCACTACTCA GCCCCGGCCA GAGCCCTGCC 3840 

AACCTGGAGA GATGGGCCTG AGAGGACAAG 3 900 

GCAGGACCGG TGCTCCCGGC CCCCAGGGGC 3 960 

GGGGCTTCCC TGGAGCAGAT GGGCGTCCAG 4020 

CCCCTGGAGC CCCTGGCCTA AAGGGCTCTC 4080 

GAGAGCGAGG ACCTCGAGGC CCAAAGGGGG 414 0 

GTGAAGGACC TGGGCTTCCT GGGCGGAAAG 4200 

CTCGTGGACC ACTGGGGGAC CCAGGACCCC 42 60 

TGAAGGGTGA CAAAGGCGAT CGTGGGGAGC 4320 

TTGCTCCTGG GGAGCCTGGG CTGCCGGGTC 43 80 

TTGGCCCCCC TGGAAAGAAA GGAGAAAAAG 444 0 

CAGGACAACC TGGGTCTCCG GGTGAGCAGG 4500 

CCAAAGGTGA CCGGGGCTTT CCAGGGCCCC 4560 

GACCCCCAGG CCCAGCGGGA TCCCGGGGGC 462 0 

AGGGTCCTGA AGGGCCACCA GGACCCACTG 4680 

GCCCTGGGGA CCCTGCAGTG GTGGGACCTG 4740 

ATGTGGGGCC CGCTGGGCCC AGAGGAGCTA 480 0 

GCTTGGTTCT TCCTGGAGAC CCTGGCCCCA 4860 

GCCTTACTGG CAGAGCAGGA CCCCCAGGTG 4 92 0 

CTGGGCGGCC TGGCCCCCCA GGACCTGTTG 498 0 

AGAAAGGTGA CGAGGGTCCT CCGGGTGACC 5040 

GCCTTCGGGG GGCACCTGGA GTTCGGGGGC 5100 

CTGGAGAGGA TGGACGAAAT GGCAGCCCTG 5160 

AGCCGGGTCC CCCAGGACCC CCGGGACGGC 522 0 

AGGGAGAGCC TGGGGACCGC GGACAAGAGG 5280 

TCCCTGGAGC CCCTGGGGAA AGGGGCATTG 5340 

GGGACCCAGG TGTCCGAGGC CCAGCAGGAG 5400 

ATGGCCGGAG CGGACTGGAT GGGAAACCAG 5460 

CTGCAGGCAA AGCTGGGGAC CCAGGGAGAG 552 0 

GCCTCCCTGG CCCCTCTGGT CCCCCTGGAT 5580 

CTGGCCTGAA TGGAAAAAAC GGAGAACCTG 5640 

AGAAAGGAGA TTCAGGCGCC TCTGGGAGAG 570 0 

GAGCTCCTGG TATCCTTGGA CCCCAGGGGC 5760 

CTGGCCAGGG TTTTCCTGGT GT CCCAGGAG 582 0 

CTGGAT CCAA AGGGGAGCAG GGCCTCCCTG 5880 

GTGTGCCGAA TGTGGATCGG TTGCTGGAAA 5940 

AGATCGTGGA GACCTGGGAT GAGAGCTCTG 600 0 

GAGGCCCCAA GGGGGACTCA GGCGAACAGG 6060 

TTCCTGGAGA ACGCGGGCTG AAGGGCGACC 612 0 

GTCTGGCCCT TGGGGAGAGG GGCCCCCCCG 6180 

AGCCTGGTAT TCCCGGGCTC CCAGGCAGGG 6240 

GAGAGAGGGG AGAACGGGGA GAGAAAGGAG 630 0 

CTGGACTCCC TGGAACCCCT GGGCCCCCCG 6360 

AGCCAGGTCC TGGACTCTCT GGAGAACAGG 6420 

AGCCGGGCAG CAATGGTGAC CAAGGTCCCA 648 0 

GAGACCGGGG AGAGCCTGGA CCGAGGGGTC 654 0 

GTGGTATGGC TGGGCCTGAA GGGAAGCCGG 6600 

CAGTGGGTGG TCATGGAGAC CCTGGACCAG 6660 

GACCCCAAGG ACCTTCTGGC CTGAAGGGGG 6720 

GCCTGACTGG ACCTACTGGA GCTGTGGGAC 6780 

TGGGT CCACA GGGGTCTCCA GGTTTGCCTG 6840 

CCCCAGGTCG AGATGGTGCC AGTGGAAAAG 6900 

GGTCACCAGG TCTGCCTGGC CCTGTCGGAC 6960 

CTGGACAGGC TGTGGTCGGG CTCCCTGGAG 702 0 

TTGCTGGAGA CCTGGTGGGT GAGCCGGGAG 70 80 

GAGGCGAGAA GGGTGAAGCT GGCCGTGCAG 7140 

AGAAAGGGGC TCCAGGACCC AAAGGTTTCA 7200 

CCCCTGGGCC TCCTGGCCCT CCAGGTGTGA 72 60 

GTGCTCCTGG TGTTGTTGGG TTCCCGGGTC 732 0 

CAGGCCCTAG TGGAGAGCGG GGTCTGGCAG 73 80 

CCCTGGGGCC ACCTGGACCA CCGGGGTCAG 7440 

GAGACAAGGG AGACCCTGGA GTAGGGCTGC 7500 
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CTGGGCCCCG AGGCGAGCGT 
AGGAGGGACC CCGAGGACTC 
GTGATGTTGG GAGTGCAGGA 
CTCCAGGCCC ACGGGGTGCC 
GTGACAAAGG ACCTCGGGGA 
CTGGTGACAA GGGCTCAGCC 
AACCTGGTGC AGCAGGGATC 
GTATCCGAGG AGAAAAAGGA 
GGGGAGTGAA GGGAGCCTGT 
CCCCAGGCCG CCCCGGGCTG 
GCCAGTCGGG GGCCCCTGGC 
ACGGGCAGCC AGGCCCCAAG 
TTGGGGGCTT CCCAGGCCCC 
GCAGTGTTGG TCCCAGAGGC 
CCGGAGAGAG AGTGGTGGGG 
AGGGGCGGCC AGGGCCTGCC 
ATGACATCCG GGGCTTTGTG 
TCATCGCATC TGGATCACGA 
TCCATGCTGT GCCTGTGCTC 
AGGATGATGA GTACTCTGAA 
CTCCTTGGGA TAGTGATGAC 
ACACCCTGCG CTGGTACCAT 
TCTATGGTGG CTGTGGAGGG 
GCTGCCCACC CCGGGTGGTC 
ATAATGAGCT G AGATT CAGC 
CCCTCCCCTT GGTGCTAGAG 
TCAGTGACTT GGTCCCGTGG 
CCTGCCACCC TGG C AG AT G A 
ACTGGCGTCT GACCCGCCCC 
GCATTAAAGC TGCTGTTTTA 
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GGGGAGCCAG 
ACGGGGCCCC 
CTAAAGGGTG 
AAGGGGGACA 
GACAATGGGG 
GGGTTGCCAG 
CCTGGTGACC 
GATGTTGGCT 
GGCCTTGATG 
GCAGGACACA 
AAGGAGGGCC 
GGTGACCAGG 
AGTGGAAATG 
CCCGAAGGAC 
GCTCCTGGGG 
GGTCCTCGAG 
CGCCAAGAGA 
CCCCTCCCTA 
CGCGTCTCTC 
TACTCCGAGT 
CCCTGTTCCC 
CGGGCTGTGA 
AATGCCAACC 
CAGAGCCAGG 
ATCCCCTGGA 
GCTTGTGTGC 
GTCTAGCCTT 
CTCACTGTGG 
TTGACCCAAG 
AAAGGCAAAA 



GCATCCGGGG 
CTGGCAGCAG 
ACAAGGGAGA 
TGGGTGAACG 
ACCCTGGTGA 
GACTGCGTGG 
CGGGATCCCC 
TCATGGGTCC 
GAGAGAAGGG 
AAGGAGAGAT 
TGATCGGTCC 
GCGAGAAAGG 
ATGGCTCTGC 
TTCAGGGCCA 
TCCCTGGAGC 
GCGAGAAGGG 
TGAGT CAGCA 
GTTATGCTGC 
ATGCAGAGGA 
ATTCTGTGGA 
TGCCACTGGA 
CAGGCAGCAC 
GTTTTGGGAC 
GGACAGGTAC 
GGAGTCGGGG 
ACGTGAGCGT 
CCCCCCTGTG 
GGGGGTGGCT 
CCTGTGATGA 
AA 



TGAAGATGGC 
GGGAGAGCGT 
CTCAGCTGTG 
AGGGCCTCGG 
CAAGGGCAGC 
ACTCCTGGGA 
AGGAAAGGAT 
CCGGGGCCTC 
AGACAAGGGA 
GGGGGAGCCT 
CAAGGGTGAC 
GGAGCGGGGA 
TGGTCCCCCA 
GAAGGGTGAG 
TCCTGGCGAG 
AGAAGCTGCA 
CTGTGCCTGG 
AGACACTGCC 
GGAAGAGCGG 
GGAGTACCAG 
TGAGGGCTCC 
AGAGGCCTGT 
CCGTGAGGCC 
TGCCCAGGAC 
TCTCAGCAGA 
GCGAGTGCAC 
GACAAACCCC 
GTGGGCAGTG 
CATGGTGCTG 



CGCCCCGGCC 7560 

GGGGAGAAGG 7620 

ATCCTGGGGC 7680 

GGCTTGGATG 7740 

AAGGGAGAGC 7800 

CCCCAGGGTC 7860 

GGAGTGCCTG 7 920 

AAGGGTGAAC 7980 

GAAGCTGGTC 8040 

GGTGTGCCGG 8100 

CGAGGCTTTG 8160 

ACCCCAGGAA 8220 

GGGCCACCTG 8280 

CGAGGTCCCC 8340 

AGAGGGGAGC 8400 

CTGACGGAGG 8460 

CAGGGCCAGT 8520 

GGCTCCCAGC 8580 

GTACCCCCTG 8640 

GACCCTGAAG 8700 

TGCACTGCCT 8760 

CACCCTTTTG 882 0 

TGCGAGCGCC 8 880 

TGAGGCCCAG 8940 

ACCCCACTGT 9000 

GTCCGTTATT 9060 

CATTGTGGCT 9120 

AGCGGATGTG 9180 

ATTGTGGGGG 9240 



Seq ID NO: 63 Protein sequence: 
Protein Accession ft: NP_ 000085.1 
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70 



75 



80 



85 



MTLRLLVAAL 
LEGLVIiPFSG 
AAILHVADHV 
EELKRVASQP 
SEPSSQSLRV 
TEYQVTVIAL 
RVLSGGPTQQ 
LRPVILGPTS 
RLTLYTLLEG 
VRSTQGVERT 
VPGLRVWSD 
YQVAVSVLRG 
SAHGPEKSQb 
RLQILNASSD 
SVRVTALVGD 
QPEGGQEQSR 
ELRWDTSID 
GVSYIFSLTP 
LALGPLGPQA 
AHRYMLAPDA 
RRLAPGMDSV 
EMGLRGQVGP 
APGLKGSPGL 
PLGDPGPRGP 
PGKKGEKGDS 
GPAGSRGLPG 
PAGPRGATGV 
PGPPGPVGPR 
DGRNGSPGSS 
APGERGIEGF 
KAGDPGRDGL 
DSGASGREGR 
KGEQGIiPGER 
KGDSGEQGPP 
IPGLPGRAGG 
PGLSGEQGPP 
AGPEGKPGLQ 
GPTGAVGLPG 
GLPGPVGPKG 
KGEAGRAGEP 
GWGFPGQTG 
GDPGVGLPGP 
DSAVILGPPG 
GLLGPQGQPG 
GDKGEAGPPG 
GERGTPGIGG 
APGERGEQGR 
ADTAGSQLHA 
D EGSCTA YTL 
TAQD 



11 
I 

CAGI LAEAPR 
AASAQGVRFA 
FLPQLARPGV 
TSDFFFFVND 
QWTAASGPVT 
YANSIGEAVS 
QELGPGQGSV 
ILLSWNLVPE 
HEVATPATW 
LVLPGSQTAF 
ATRVRVAWGP 
REEGPAAVIV 
VSGEATVAEL 
VLRITWVGVT 
REGTPVSIW 
VLGPELSSYH 
SVTLAWTPVS 
VLDGVRGPEA 
VQVGLLSYSH 
PGRRQHVPGV 
QTFFAVDDGP 
PGDPGLPGRT 
PGPRGDPGER 
PGLPGTAMKG 
EDGAPGLPGQ 
VAGRPGAKGP 
QGERGPPGLV 
GRDGEVGEKG 
GPKGDRGEPG 
RGPPGPQGDP 
PGLRGEQGLP 
DGPKGERGAP 
GIiRGEPGSVP 
GKEGPIGFPG 
VGEAGRPGER 
GLKGAKGEPG 
GPRGPPGPVG 
PPGPSGLVGP 
EPGPTGAPGQ 
GDPGEDGQKG 
PRGEMGQPGP 
RGERGEPGIR 
PRGAKGDMGE 
AAGIPGDPGS 
RPGLAGHKGE 
FPGPSGNDGS 
PGPAGPRGEK 
VPVLRVSHAE 
RWYHRAVTGS 



21 
I 

VRAQHRERVT 

TVQYSDDPRT 

PKVCILITDG 

FSILRTLLPL 

GYKVQYTPLT 

GTARTTALEG 

LLRDLEPGTD' 

ARGYRLEWRR 

PTGPELPVSP 

DLDDVQAGLS 

VPGASGFRIS 

ARTDPLGPVR 

DGLEPDTEYT 

GATAYRLAWG 

TTPPEAPPAL 

LDGLEPATQY 

RASSYILSWR 

SVTQTPVCPR 

RPSPLFPLNG 

MVLLVDEPLR 

SLDQAVSGLA 

GAPGPQGPPG 

GPRGPKGEPG 

DKGDRGERGP 

PGSPGEQGPR 

EGPPGPTGRQ 

LPGDPGPKGD 

DEGPPGDPGL 

PPGPPGRLVD 

GVRGPAGEKG 

GPSGPPGLPG 

GILGPQGPPG 

NVDRLLETAG 

ERGLKGDRGD 

GERGEKGERG 

SNGDQGPKGD 

GHGDPGP PGA 

QGSPGLPGQV 

AWGLPGAKG 

APGPKGFKGD 

SGERGLAGPP 

GEDGRPGQEG 

RGPRGLDGDK 

PGKDGVPGIR 

MGEPGVPGQS 

AGPPGPPGSV 

GEAALTEDD I 

EEERVPPEDD 

TEACHPFVYG 
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CTRLYAAD IV 
EFGLDALGSG 
KSQDLVDTAA 
VSRRVCTTAG 
GLGQPLPSER 
PEDTIQNTTA 
YEVTVSTLFG 
ETGLEPPQKV 
VTDLQATELP 
YTVRVSARVG 
WSTGSGPESS 
TVHVTQASSS 
VHVRAHVAGV 
RSEGGPMRHQ 
GTLKWQRGE 
RVRLSVLGPA 
PLRGPGQEVP 
GLADWFLPH 
SHDLGIILQR 
GDIFSPIREA 
TALCQASFTT 
SATAKGERGF 
APGQVIGGEG 
PGPGEGGIAP 
GPPGAIGPKG 
GEKGEPGRPG 
PGDRGPIGLT 
PGKAGERGLR 
TGPGAREKGE 
DRGPPGLDGR 
KPGEDGKPGL 
LPGPVGPPGQ 
IKASAIjREIV 
PGPQGPPGLA 
EQGRDGPPGL 
RGVPGIKGDR 
PGLAGPAGPQ 
GETGKPGAPG 
EKGAPGGLAG 
PGVGVPGSPG 
GREGIPGPLG 
PRGLTGPPGS 
GPRGDNGDPG 
GEKGDVGFMG 
GAPGKEGLIG 
GPRGPEGLQG 
RGFVRQEMSQ 
EYSEYSEYSV 
GCGGNANRFG 



41 
I 

FLLDGSSSIG 
GDVIRAIREL 
QRLKGQGVKL 
GVPVTRPPDD 
QEVNVPAGET 
HSLLVAWRSV 
RSVGPATSLM 
VLPSDVTRYQ 
GQRVRVSWSP 
PREGSASVLT 
QTLPPDSTAT 
SVTITWTRVP 
DGPPASVWR 
ILPGNTDSAE 
HSLRLRWEPV 
GEGPSAEVTA 
GSPQTLPGIS 
ATQDNAHRAE 
IRDMPYMDPS 
QASGLNWML 
QPRPEPCPVY 
PGADGRPGSP 
PGLPGRKGDP 
GEPGLPGLPG 
DRGFPGPLGE 
DPAWGPAVA 
GRAGPPGDSG 
GAPGVRGPVG 
PGDRGQEGPR 
SGLDGKPGAA 
NGKNGEPGDP 
GFPGVPGGTG 
ETWDESSGSF 
LGERGPPGPS 
PGTPGPPGPP 
GEPGPRGQDG 
GPSGLKGEPG 
RDGASGKDGD 
DLVGEPGAKG 
PPGPPGVKGD 
PPGPPGSVGP 
RGERGEKGDV 
DKGSKGEPGD 
PRGLKGERGV 
PKGDRGFDGQ 
QKGERGPPGE 
HCACQGQFIA 
EEYQDPEAPW 
TREACERRCP 



51 
I 

RSNFREVRSF 60 

SYKGGNTRTG 120 

FAVGIKNADP 180 

STSAPRDLVL 240 

SVRLRGLRPL 300 

PGATGYRVTW 360 

ARTDASVEQT 420 

LDGLQPGTEY 480 

VPGATQYRII 54 0 

VRREPETPLA 600 

DITGLQPGTT 660 

GATGYRVSWH 720 

TAPEPVGRVS 780 

IRGLEGGVSY 840 

PRAQGFLLHW 900 

RTESPRVPSI 960 

SSQRVTGLEP 1020 

ATRRVLERLV 1080 

GNNLGTAWT 1140 

GMAGADPEQL 1200 

CPKGQKGEPG 1260 

GRAGNPGTPG 1320 

GPSGPPGPRG 1380 

SPGPQGPVGP 1440 

AGEKGERGPP 1500 

GPKGEKGDVG 1560 

PPGEKGDPGR 1620 

EKGDQGDPGE 1680 

GPKGDPGLPG 1740 

GPSGPNGAAG 1800 

GEDGRKGEKG 1860 

PKGDRGETGS 1920 

LPVPERRRGP 1980 

GLAGEPGKPG 2040 

GPKVSVDEPG 2100 

NPGLPGERGM 2160 

ETGPPGRGLT 2220 

RGSPGVPGSP 2280 

DRGLPGPRGE 2340 

LGLPGLPGAP 2400 

PGASGLKGDK 2460 

GSAGLKGDKG 2520 

KG S AGLPGLR 2580 

KGACGLDGEK 2640 

PGPKGDQGEK 2700 

RWGAPGVPG 2760 

SGSRPLPSYA 2820 

DSDDPCSLPL 2880 

PRWQSQGTG 2940 



212 



10 



WO 02/086443 

Seq ID NO: 64 DNA sequence 

Nucleic Acid Accession #: NM_006945 

Coding sequence: 1-219 

1 11 21 31 41 51 

I I I I I I 

ATGTCTTATC AACAGCAGCA GTGCAAGCAG CCCTGCCAGC CACCTCCTGT GTGCCCCACG 
CCAAAGTGCC CAGAGCCATG TCCACCCCCG AAGTGCCCTG AGCCCTGCCC ACCACCAAAG 
TGTCCACAGC CCTGCCCACC TCAGCAGTGC CAGCAGAAAT ATCCTCCTGT GACACCTTCC 
CCACCCTGCC AGCCAAAGTA TCCACCGAAG AGCAAGTAA 



60 
120 
180 



PCT/US02/12476 
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Seq ID NO: 65 Protein sequence: 
Protein Accession #: NP_008876 
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21 31 41 51 

1 I I I I I 

MSYQQQQCKQ PCQPPPVCPT PKCPEPCPPP KCPEPCPPPK CPQPCPPQQC QQKYPPVTPS 
PPCQPKYPPK SK 

Seq ID NO: 66 DNA sequence 

Nucleic Acid Accession #: NM_005629.1 

Coding sequence: 639-2546 



60 



11 



85 



TAGTCGGAGC 
CCGCCGCCGG 
CCGCCGCCAC 
CGGGGCGGGG 
CCGATGTCGC 
GCCGCCGCCC 
GCCGGGCCCC 
CTCACTTTCA 
CGTCCGCCCG 
CCTCGGGGCC 
GCCGCGACCC 
ACGGCATCTA 
ACGGGGCCCC 
CCGTGCCGCC 
TCGCCGTGGG 
GTGTGTTCCT 
TAG AG AT C T C 
CCCTGTTCAA 
ACATCATGGT 
CCTGGGCCAC 
AAGACTGTGC 
CCCCTGTCAT 
CAGGGGCCCT 
TCTGTGTCTG 
CCTACGTGGT 
GCATCATTTA 
ATGCGGGGAC 
GCAGCTACAA 
ACAGTGGGAC 
CAGAGCAGGG 
CCTACCCGCG 
TCATGCTGTT 
GCCTCCTCGA 
CCCTCTGTTG 
ACGTCTTCCA 
TTTGGGAGTG 
CCTGTATGAT 
CGCTGGTCTG 
ACAACACCTA 
CCATGCTGTG 
CTGAGCGCTG 
CTCAGGACGC 
TCGTCGTGGT 
GCCATAGCAG 
CACTTTTGGG 
ACTTTTTCCA 
TCCCCCTCCA 
CAGTGCTGCA 
CTCTGCAGCA 
TGTGAGGAAG 
GAGGGGCAGC 
TTATAGAAGC 
CCAGTATCAA 
TATAGATCTC 
GGAGGCTTGT 
TTTCTAAAAA 
CCTACCTTAC 
GCAAAACAAA 
GTCCCCAGCC 
GCTGTCCCTT 
GGGCTGCTAA 
GACCCTGGAC 



GAGGTGGCGA 
GAAGGAGAGG 
CACCGCCACC 
GGCGCGGGCC 
CCGCGCCCCG 
GAGCCGCGGG 
GACGCCGCCC 
AGTGCTTCGT 
CCGCCCCGTC 
CTCCCCGGTG 
CGGCCCGGCC 
TAGCGTGTCC 
GGCCAAGGGC 
GCGCGAGACC 
CTTGGGCAAC 
TATTCCCTAC 
GCTGGGCCAG 
AGGCCTGGGC 
GCTGGCCTGG 
ATGTGGCCAC 
CAATGCCAGC 
CGAGTTCTGG 
CAACTGGGAG 
GAAGGGGGTC 
CCTGGTCGTG 
CTATCTCAAG 
CCAGATTTTC 
CCGCTTCAAC 
CAGCTTCTTT 
CGTGCACATC 
GGCTGTCACG 
GCTGCTTGGT 
CCTCCTCCCG 
TGCCCTCTGC 
GCTGTTTGAC 
CGTGGTGGTG 
CGGGTACCGA 
CATGGGCATC 
CGTGTACCCG 
CGTGCCGCTG 
GCAGCACCTG 
AGATGTCAGG 
GGAGAGTGTC 
CCCCTGCTTC 
GTCTGCCTGG 
TTTTTAATAA 
GCCCTAGCCG 
CTCCTCCTGC 
CACCCGTGGG 
GGAAGGAGGG 
AGAACCAAGG 
TTAGAGAGCC 
TTGTGTGAGC 
TATCTCTTAG 
ATTTTGCACA 
GAGGAAGGAG 
CCCTCTGCCC 
AGCTTCGAGC 
CCAGACTGGA 
TGCCACAAGT 
CCTGGCCTGC 
ACGGCTCCCA 



21 
I 

GTCGCTGAGC 
GCGAGGCGCG 
GGAGTCGCGG 
ACAGGCCCCT 
TTAGGATGAG 
CAGGAGCCTC 
GCGCGCCCCC 
GGACTGCTTC 
CCCCGGCCCG 
CCGCCGGTGC 
GTGCGGCCCG 
GGCGACGAGA 
GACGGCCCCG 
TGGACGCGCC 
GTGTGGCGCT 
GTCCTGATCG 
TTCATGAAGG 
TACGCCTCCA 
GGCTTCTATT 
ACCTGGAACA 
CTGGCCAACC 
GAGAACAAAG 
GTGACCCTTT 
AAAT CCACGG 
CTGCTGGTGC 
CCTGACTGGT 
TTTTCTTACG 
AACAACTGCT 
GCTGGCTTCG 
TCCAAGGTGG 
CTGATGCCAG 
CTCGACAGCC 
GCCTCCTACT 
TTTGTCATCG 
TACT ACT CGG 
GCCTGGGTGT 
CCTTGCCCCT 
TTCATCTTCA 
TGGTGGGGTG 
CACCTCCTGG 
ACCCAGCCCA 
GGCCTGACCA 
ATGTGACAAC 
AGCCCCACCG 
GGGAGGAGGG 
AACGCCAAAA 
AGCTGGTCCT 
CCCTGCCACG 
TGACCCCTCA 
AGAGACGGGA 
CAAATATTTC 
AGCCAGCAAT 
TTGGGTGCGA 
CAAAGGTGAA 
TTTTATAAAA 
CCCAAACCAT 
CTAGCCAAGG 
TGTTGCGTGT 
TTGGAAAAGT 
CTGTGGGGCA 
TCAGGCTTCC 
CGTCCAGGCT 



31 

I 

CCGCCGCGGC 
CCCGAGCCGC 
GCCAGCCGGG 
GCTCCGGCCG 
TCTCGGGTCG 
GGGAGCCGCC 
GGGCCCCCGA 
TGACTGCGCC 
GCCGCCCCCC 
CCCCCGCCTG 
CCGGGGCCAT 
AGAAGGGCCC 
TGGGCCTGGG 
AGATGGACTT 
TCCCCTACCT 
CCCTGGTTGG 
CCGGCAGCAT 
TGGTGATCGT 
ACCTGGT CAA 
CTCCCGACTG 
TCACCTGTGA 
TCTTGAGGCT 
GTCTGCTGGC 
GAAAG AT CGT 
GTGGAGTGCT 
CAAAGCTGGG 
CCATTGGCCT 
ACAAGGACGC 
TGGTCTTCTC 
CAGAGTCAGG 
TGGCCCCACT 
AGTTTGTAGG 
ACTTCCGTTT 
ATCTCTCCAT 
CCAGCGGCAC 
ACGGAGCTGA 
GGATGAAATG 
ACGTTGTGTA 
AGGCCATGGG 
GCTGCCTCCT 
TCTGGGGCCT 
CCCTGACCCC 
TCAGCTCACA 
CACCCCTCCA 
GAGAAAGCAC 
ATATCACAAC 
AGGCCCCGCC 
CCCACCCCCT 
CCCCAGAAGC 
GGGAGGAGAG 
AGCTGGGCTA 
GGAACCTTCT 
GTGCACGCGT 
TGCCAGATGT 
ACTTGAGAGA 
CCTCTCCTTA 
AGTGTGAATT 
GTGAGTCTGT 
GCATGGTGGG 
AGAGGCTGCA 
CACCCTGTGC 
TAAGGTGGAT 



41 

I 

CCCGAGAGCG 
CGCCGCCGCC 
CAGCCTCCGC 
TCGTTTGCAG 
GGCGAGGAGC 
GCCGCCGCCG 
CACACATGAG 
GCCCGCGCCC 
GGCCCCCGGC 
ACCGCCGCCC 
GGCGAAGAAG 
CCTCATCGCG 
GACACCCGGC 
CATCATGTCG 
GTGCTACAAG 
AGGAAT CCCC 
CAATGTCTGG 
CTTCTACTGC 
GTCCTTTACC 
CGTGGAG AT C 
CCAGCTTGCT 
GTCTGGGGGA 
CTGCTGGGTG 
GTACTTCACT 
GCTGCCTGGC 
GTCCCCTCAG 
GGGGGCCCTC 
CATCATCCTG 
CATCCTGGGC 
GCCGGGCCTG 
CTGGGCTGCC 
TGTGGAGGGC 
CCAAAGGGAG 
GGTGACTGAT 
CACCCTGCTC 
CCGCTTCATG 
GTGCTGGTCC 
CTACGAGCCG 
CTGGGCCTTC 
CAGGGCCAAG 
CCACCACTTG 
AGTGT CCGAG 
TCACCAGCTC 
GGGGGCCTGC 
CATGAGTGCT 
CCACCAAAAA 
TAGTGCCCCA 
GCCCACCTCT 
AGCAGTGGCA 
AGAGGAGAAG 
TACCCCTCTC 
GGTTCCTGCG 
GCGTGAGTAC 
AAATGGCGCC 
ATGAGATTTC 
CCACTCCCAT 
TATAGATCTA 
TGTGTGGATG 
GGCCTCGGGG 
ATATTCCGTC 
GGGGCACACC 
GCACTTCCCG 



51 
I 

GCTGCAGCCG 
GCCACCGCCG 
GGGCCCCGGC 
ACCGCGGGCG 
CGCCGCAGCC 
CCGCCGCCCG 
ATTCTTCAGG 
CGCACCCCGC 
CGGCCCGCGC 
CCCGTGAGGC 
AGCGCCGAGA 
CCCGGGCCCG 
GGCCGCCTGG 
TGCGTGGGCT 
AACGGCGGAG 
ATTTTCTTCT 
AACATCTGTC 
AACACCTACT 
ACCACGCTGC 
TTCCGCCATG 
GACCGCCGGT 
CTGGAGGTGC 
CTGGTCTACT 
GCTACATTCC 
GCCCTGGATG 
GTGTGGATAG 
ACAGCCCTGG 
GCTCTCATCA 
TTCATGGCTG 
GCCTTCATCG 
CTGTTCTTCT 
TTCATCACCG 
ATCTCTGTGG 
GGCGGGATGT 
TGGCAGGCCT 
GACGACATTG 
TTCTTCACCC 
CTGGTCTACA 
GCCCTGTCCT 
GGCACCATGG 
GAGTACCGAG 
AGCAGCAAGG 
ACCTCTGGTA 
CTTTCCCTGA 
CACTAAAACA 
TAGATGCCTC 
CCCCCACCCA 
CCAGGCTCTG 
GCTTGGGAAA 
GGAGGCAGGG 
CCCATCCCTG 
CCAATCGCCA 
GGAGAGTATA 
TCTGGGCAAA 
TGCTTGTATA 
CCCTGTGAGC 
ACTTTCATAG 
TGCGTGTGTG 
CTGTCCCCAC 
CTGGGTGTCT 
CCCAGGAAGG 
CACCTCCAGT 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
720 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 
2280 
2340 
2400 
2460 
2520 
2580 
2640 
2700 
2760 
2820 
2880 
2940 
3000 
3060 
3120 
3180 
3240 
3300 
3360 
3420 
3480 
3540 
3600 
3660 
3720 



213 



WO 02/086443 

CTTCTGTGTA GCAGCTTTAA CCCACGTTTG TCTGTCACGT CCAGTCCCGA GACGGCTGAG 3780 

TGACCCCAAG AAAGGCTTCC CCGACACCCA GACAGAGGCT GCAGGGCTGG GGCTGGGTGA 3840 

GGGTGGCGGG CCTGCGGGGA CATT CTACTG TGCTAAAAAG CCACTGCAGA CATAGCAATA 3900 
AAAACATGTC ATTTTCC 



PCT/US02/12476 



Seq ID NO: 67 Protein sequence: 
Protein Accession #: NP_005620.1 



10 



15 



20 



1 11 21 31 41 51 

I I I I I I 

MAKKSAENGI YSVSGDEKKG PL I APGPDGA PAKGDGPVGL GTPGGRLAVP PRETWTRQMD 60 

FIMSCVGFAV GLGNVWRPPY LCYKNGGGVF LTPYVLIALV GGIPIFFLEI SLGQFMKAGS 12 0 

INVWNICPLF KGLGYASMVI VFYCNTYYIM VLAWGFYYLV KSFTTTLPWA TCGHTWNTPD 180 

CVEIFRHEDC ANASLANLTC DQLADRRSPV IEFWENKVLR DSGGLEVPGA LNWEVTLCLL 240 

ACWVLVYFCV WKGVKSTGKI VYFTATFPYV VLWLLVRGV LLPGALDGI I YYLKPDWSKL 300 

GSPQVWIDAG TQIFFSYAIG LGALTALGSY NRFNNNCYKD AIILALINSG TSFFAGFWF 360 

SILGFMAAEQ GVHISKVAES G P GliAF I A YP RAVTLMPVAP LWAALFFFML LLLGLDSQFV 42 0 

GVEGFITGLL DLLPASYYFR FQREISVALC CALCFVIDLS MVTDGGMYVF QLFDYYSASG 480 

TTLLWQAFWE CWVAWVYGA DRFMDD I ACM IGYRPCPWMK WCWSFFTPLV CMGIFIFNW 540 

YYEPLVYNNT YVYPWWGEAM GWAFALSSML CVPLHLLGCL LRAKGTMAER WQHLTQPIWG 600 
LHHLEYRAQD ADVRGLTTLT PVSESSKWV VESVM 
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Seq ID NO: 68 DNA sequence 

Nucleic Acid Accession #: NM_021953.1 

Coding sequence: 178-2469 

1 11 21 31 41 51 

I 1 I I I I 

GGCACGAGGG GGACCCGGCC GGTCCGGCGC GAGCCCCCGT CCGGGGCCCT GGCTCGGCCC 60 

CCAGGTTGGA GGAGCCCGGA GCCCGCCTTC GGAGCTACGG CCTAACGGCG GCGGCGACTG 120 

CAGTCTGGAG GGTCCACACT TGTGATTCTC AATGGAGAGT GAAAACGCAG ATT CATAATG 180 

AAAGCTAGCC CCCGTCGGCC ACTGATTCTC AAAAGACGGA GGCTGCCCCT TCCTGTTCAA 240 

AATGCCCCAA GTGAAACATC AGAGGAGGAA CCTAAGAGAT CCCCTGCCCA ACAGGAGTCT 3 00 

AATCAAGCAG AGGCCTCCAA GGAAGTGGCG GAGTCCAACT CTTGCAAGTT TCCAGCTGGG 360 

ATCAAGATTA TTAACCACCC CACCATGCCC AACACGCAAG TAGTGGCCAT CCCCAACAAT 42 0 

GCTAATATTC ACAGCATCAT CACAGCACTG ACTGCCAAGG GAAAAGAGAG TGGCAGTAGT 480 

GGGCCCAACA AATTCATCCT CATCAGCTGT GGGGGAGCCC CAACTCAGCC TCCAGGACTC 540 

CGGCCTCAAA CCCAAACCAG CTATGATGCC AAAAGGACAG AAGTGACCCT GGAGACCTTG 60 0 

GGACCAAAAC CTGCAGCTAG GGATGTGAAT CTT CCTAGAC CACCTGGAGC CCTTTGCGAG 660 

CAGAAACGGG AGACCTGTGC AGATGGTGAG GCAGCAGGCT GCACTATCAA CAATAGCCTA 720 

TCCAACATCC AGTGGCTTCG AAAGATGAGT TCTGATGGAC TGGGCTCCCG CAGCATCAAG 780 

CAAGAGATGG AGGAAAAGGA GAATTGTCAC CTGGAGCAGC GACAGGTTAA GGTTGAGGAG 840 

CCTTCGAGAC CATCAGCGTC CTGGCAGAAC TCTGTGTCTG AGCGGCCACC CTACTCTTAC 900 

ATGGCCATGA TACAATTCGC CAT CAACAGC ACTGAGAGGA AGCGCATGAC TTTGAAAGAC 960 

AT CTAT ACGT GGATTGAGGA CCACTTTCCC TACTTTAAGC ACATTGCCAA GCCAGGCTGG 102 0 

AAGAACTCCA TCCGCCACAA CCTTTCCCTG CACGACATGT TTGTCCGGGA GACGTCTGCC 1080 

AATGGCAAGG TCTCCTTCTG GACCATTCAC CCCAGTGCCA ACCGCTACTT GACATTGGAC 1140 

CAGGTGTTTA AGCCACTGGA CCCAGGGTCT CCACAATTGC CCGAGCACTT GGAATCACAG 12 00 

CAGAAACGAC CGAATCCAGA GCTCCGCCGG AACATGACCA T C AAAACCGA ACTCCCCCTG 12 6 0 

GGCGCACGGC GGAAGATGAA GCCACTGCTA CCACGGGTCA GCTCATACCT GGTACCTATC 132 0 

CAGTTCCCGG TGAACCAGTC ACTGGTGTTG CAGCCCTCGG TGAAGGTGCC ATTGCCCCTG 1380 

GCGGCTTCCC TCATGAGCTC AGAGCTTGCC CGCCATAGCA AGCGAGTCCG CATTGCCCCC 1440 

AAGGTGCTGC TAGCTGAGGA GGGGATAGCT CCTCTTTCTT CTGCAGGACC AGGGAAAGAG 1500 

GAGAAACTCC TGTTTGGAGA AGGGTTTTCT CCTTTGCTTC CAGTTCAGAC TATCAAGGAG 1560 

GAAGAAATCC AGCCTGGGGA GGAAATGCCA CACTTAGCGA GACCCATCAA AGTGGAGAGC 1620 

CCTCCCTTGG AAGAGTGGCC CTCCCCGGCC CCATCTTTCA AAGAGGAATC ATCTCACTCC 1680 

TGGGAGGATT CGTCCCAATC TCCCACCCCA AGACCCAAGA AGTCCTACAG TGGGCTTAGG 1740 

TCCCCAACCC GGTGTGTCTC GGAAATGCTT GTGATTCAAC ACAGGGAGAG GAGGGAGAGG 1800 

AGCCGGTCTC GGAGGAAACA GCATCTACTG CCTCCCTGTG TGGATGAGCC GGAGCTGCTC 1860 

TTCTCAGAGG GGCCCAGTAC TTCCCGCTGG GCCGCAGAGC TCCCGTTCCC AGCAGACTCC 192 0 

TCTGACCCTG CCTCCCAGCT CAGCTACTCC CAGGAAGTGG GAGGACCTTT TAAGACACCC 1980 

ATTAAGGAAA CGCTGCCCAT CTCCTCCACC CCGAGCAAAT CTGTCCTCCC CAGAACCCCT 2 040 

GAAT CCTGGA GGCTCACGCC CCCAGCCAAA GTAGGGGGAC TGGATTTCAG CCCAGTACAA 210 0 

ACCTCCCAGG GTGCCTCTGA CCCCTTGCCT GACCCCCTGG GGCTGATGGA TCTCAGCACC 2160 

ACTCCCTTGC AAAGTGCTCC CCCCCTTGAA TCACCGCAAA GGCTCCTCAG TTCAGAACCC 2220 

TTAGACCTCA TCTCCGTCCC CTTTGGCAAC TCTTCTCCCT CAGATATAGA CGTCCCCAAG 2280 

CCAGGCTCCC CGG AG CCACA GGTTTCTGGC CTTGCAGCCA ATCGTTCTCT GACAGAAGGC 2340 

CTGGTCCTGG A C AC AATGAA TGACAGCCTC AGCAAGATCC TGCTGGACAT CAGCTTTCCT 2400 

GGCCTGGACG AGGACCCACT GGGCCCTGAC AACATCAACT GGTCCCAGTT TATTCCTGAG 2460 

CTACAGTAGA GCCCTGCCCT TGCCCCTGTG CTCAAGCTGT CCACCATCCC GGGCACTCCA 2520 

AGGCTCAGTG CACCCCAAGC CTCTGAGTGA GGACAGCAGG CAGGGACTGT TCTGCTCCTC 2580 

ATAGCTCCCT GCTGCCTGAT TATGCAAAAG TAGCAGTCAC ACCCTAGCCA CTGCTGGGAC 2 640 

CTTGTGTTCC CCAAGAGTAT CTGATTCCTC TGCTGTCCCT GCCAGGAGCT GAAGGGTGGG 2 700 

AACAACAAAG GCAATGGTGA AAAGAGATTA GGAACCCCCC AGCCTGTTTC CATTCTCTGC 2760 

CCAGCAGTCT CTTACCTTCC CTGATCTTTG CAGGGTGGTC CGTGTAAATA GTATAAATTC 282 0 

TCCAAATTAT CCTCTAATTA TAAATGTAAG CTTATTTCCT TAGATCATTA T CCAGAGACT 2880 

GCCAGAAGGT GGGTAGGATG ACCTGGGGTT TCAATTGACT TCTGTTCCTT GCTTTTAGTT 2 940 

TTGATAGAAG GGAAGACCTG CAGTGCACGG TTTCTTCCAG GCTGAGGTAC CTGGAT CTTG 3000 

GGTTCTTCAC TGCAGGGACC CAGACAAGTG GATCTGCTTG CCAGAGTCCT TTTTGCCCCT 3 0 60 

CCCTGCCACC TCCCCGTGTT TCCAAGTCAG CTTTCCTGCA AGAAGAAATC CTGGTTAAAA 3120 

AAGTCTTTTG TATTGGGTCA GGAGTTGAAT TTGGGGTGGG AGGATGGATG CAACTGAAGC 3180 

AGAGTGTGGG TGCCCAGATG TGCGCTATTA GATGTTTCTC TGATAATGTC CCCAAT CAT A 3240 

CCAGGGAGAC TGGCATTGAC GAGAACTCAG GTGGAGGCTT GAGAAGGCCG AAAGGGCCCC 33 00 

TGACCTGCCT GGCTTCCTTA GCTTGCCCCT CAGCTTTGCA AAGAGCCACC CTAGGCCCCA 3360 

GCTGACCGCA TGGGTGTGAG CCAGCTTGAG AACACTAACT ACTCAATAAA AGCGAAGGTG 3420 
GACCNAAAAA AAAAAAAAAA AAAA 
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WO 02/086443 



PCT/US02/12476 



Seq ID NO: 69 Protein sequence: 
Protein Accession #: NP_068772.1 
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MKASPRRPLI 
GIKIINHPTM 
LRPQTQTSYD 
LSNIQWLRKM 
YMAMIQFAIN 
ANGKVSFWTI 
LGARRKMKPL 
PKVLLAEEGI 
SPPLEEWPSP 
RSRSRRKQHL 
PIKETLPISS 
TTPLQSAPPL 
GLVI/DTMNDS 



LKRRRLPLPV 
PNTQWAIPN 
AKRTEVTLET 
SSDGLGSRSI 
STERKRMTLK 
HPSANRYLTL 
LPRVSSYLVP 
APLSSAGPGK 
APSFKEESSH 
LPPCVDEPEL 
TPSKSVLPRT 
ESPQRLLSSE 
LSKILLDISF 



21 
I 

QNAPSETSEE 
NANIHSIITA 
LGPKPAARDV 
KQEMEEKENC 
DIYTWIEDHF 
DQVFKPLDPG 
IQFPVNQSLV 
EEKLLFGEGF 
SWEDSSQSPT 
LFSEGPSTSR 
PESWRLTPPA 
PLDLISVPFG 
PGLDEDPLGP 



31 
I 

EPKRSPAQQE 
LTAKGKESGS 
NLPRPPGALC 
HLEQRQVKVE 
PYFKHIAKPG 
SPQLPEHLES 
LQPSVKVPLP 
SPLLPVQTIK 
PRPKKSYSGL 
WAAELPFPAD 
KVGGLDF S P V 
NSSPSDIDVP 
DNINWSQFIP 



41 

I 

SNQAEASKEV 
SGPNKFILIS 
EQKRETCADG 
EPSRPSASWQ 
WKNSIRHNLS 
QQKRPNPELR 
LAASLMSSEL 
EEEIQPGEEM 
RSPTRCVSEM 
SSDPASQLSY 
QTSQGASDPL 
KPGSPEPQVS 
ELQ 



51 
I 

AESNSCKFPA 60 

CGGAPTQPPG 12 0 

EAAGCTINNS 180 

NSVSERPPYS 240 

LHDMFVRETS 300 

RNMTIKTEIiP 360 

ARHSKRVRIA 420 

PHLARPIKVE 480 

LVIQHRERRE 540 

SQEVGGPFKT 600 

PDPLGLMDLS 660 

GLAANRSLTE 72 0 
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Seq ID NO: 70 DNA sequence 

Nucleic Acid Accession #: BC006529.1 

Coding sequence: 178-2424 
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GGCACGAGGG 
CCAGGTTGGA 
CAGTCTGGAG 
AAAACTAGCC 
AATGCCCCAA 
AATCAAGCAG 
ATCAAGATTA 
GCTAATATTC 
GGGCCCAACA 
CGGCCTCAAA 
GGACCAAAAC 
CAGAAACGGG 
TCCAACATCC 
CAAGAGATGG 
CCTTCGAGAC 
ATGGCCATGA 
ATCTATACGT 
AAGAACT CCA 
AATGGCAAGG 
CAGGTGTTTA 
ACCGAACTCC 
TACCTGGTAC 
GTGCCATTGC 
GTCCGCATTG 
GGACCAGGGA 
CAGACTATCA 
ATCAAAGTGG 
G AAT CAT CTC 
TACAGTGGGC 
GAGAGGAGGG 
GAGCCGGAGC 
TTCCCAGCAG 
CCTTTTAAGA 
CTCCCCAGAA 
TTCAGCCCAG 
ATGGATCTCA 
CTCAGTTCAG 
ATAGACGTCC 
TCTCTGACAG 
GACATCAGCT 
CAGTTTATTC 
ATCCCGGGCA 
ACTGTTCTGC 
AGCCACTGCT 
GAGCTGAAGG 
GTTTCCATTC 
AAATAGTATA 
CATTAT CCAG 
TCCTTGCTTT 
GGTACCTGGA 
GTCCTTTTTG 
AAATCCTGGT 
GGATGCAACT 
ATGTCCCCAA 
GGCCGAAAGG 
CCACCCTAGG 
AT AAAAG CGA 



GGACCCGGCC 

GGAGCCCGGA 

GGTCCACACT 

CCCGTCGGCC 

GTGAAACATC 

AGGCCTCCAA 

TTAACCACCC 

ACAGCATCAT 

AATTCATCCT 

CCCAAACCAG 

CTGCAGCTAG 

AGACCTGTGC 

AGTGGCTTCG 

AGGAAAAGGA 

CATCAGCGTC 

TACAATTCGC 

GGATTGAGGA 

TCCGCCACAA 

TCTCCTTCTG 

AG C AGCAG AA 

CCCTGGGCGC 

CTATCCAGTT 

CCCTGGCGGC 

CCCCCAAGGT 

AAGAGGAGAA 

AGGAGGAAGA 

AGAGCCCTCC 

ACTCCTGGGA 

TTAGGTCCCC 

AG AGG AG CCG 

TGCTCTTCTC 

ACTCCTCTGA 

CACCCATTAA 

CCCCTGAATC 

TACAAACCCC 

GCACCACTCC 

AACCCTTAGA 

CCAAGCCAGG 

AAGGCCTGGT 

TTCCTGGCCT 

CTGAGCTACA 

CTCCAAGGCT 

TCCTCATAGC 

GGGACCTTGT 

GTGGGAACAA 

TCTGCCCAGC 

AATTCTCCAA 

AGACTGCCAG 

TAGTTTTGAT 

TCTTGGGTTC 

CCCCTCCCTG 

TAAAAAAGTC 

GAAGCAGAGT 

TCATACCAGG 

GCCCCTGACC 

CCCCAGCTGA 

AGGTGGAAAA 



21 
I 

GGTCCGGCGC 
GCCCGCCTTC 
TGTGATTCTC 
ACTGATTCTC 
AGAGGAGGAA 
GGAAGTGGCA 
CACCATGCCC 
CACAGCACTG 
CATCAGCTGT 
CTATGATGCC 
GGATGTGAAT 
AGATGGTGAG 
AAAGATGAGT 
GAATTGTCAC 
CTGGCAGAAC 
CATCAACAGC 
CCACTTTCCC 
CCTTTCCCTG 
GACC AT TCAC 
ACGACCGAAT 
ACGGCGGAAG 
CCCGGTGAAC 
TTCCCTCATG 
GCTGCTAGCT 
ACTCCTGTTT 
AATCCAGCCT 
CTTGGAAGAG 
GGATTCGTCC 
AACCCGGTGT 
GTCTCGGAGG 
AGAGGGGCCC 
CCCTGCCTCC 
GGAAACGCTG 
CTGGAGGCTC 
CCAGGGTGCC 
CTTGCAAAGT 
CCTCATCTCC 
CTCCCCGGAG 
CCTGGACACA 
GGACGAGGAC 
GTAGAGCCCT 
CAGTGCACCC 
TCCCTGCTGC 
GTTCCCCAAG 
CAAAGGCAAT 
AGTCTCTTAC 
ATTATCCTCT 
AAGGTGGGTA 
AGAAGGGAAG 
TTCACTGCAG 
CCACCTCCCC 
TTTTGTATTG 
GTGGGTGCCC 
GAGACTGGCA 
TGCCTGGCTT 
CCGCATGGGT 
AAAAAAAAAA 



31 
I 

GAGCCCCCGT 
GGAGCTACGG 
AATGGAGAGT 
AAAAGACGGA 
CCTAAGAGAT 
GAGTCCAACT 
AACACGCAAG 
ACTGCCAAGG 
GGGGGAGCCC 
AAAAGGACAG 
CTTCCTAGAC 
GCAGCAGGCT 
TCTGATGGAC 
CTGGAGCAGC 
TCTGTGTCTG 
ACTGAGAGGA 
TACT TTAAGC 
CACGACATGT 
CCCAGTGCCA 
CCAGAGCTCC 
ATGAAGCCAC 
CAGTCACTGG 
AGCTCAGAGC 
GAGGAGGGGA 
GGAGAAGGGT 
GGGGAGGAAA 
TGGCCCTCCC 
CAATCTCCCA 
GTCTCGGAAA 
AAACAGCATC 
AGTACTTCCC 
CAGCTCAGCT 
CCCATCTCCT 
ACGCCCCCAG 
TCTGACCCCT 
GCTCCCCCCC 
GTCCCCTTTG 
CCACAGGTTT 
ATGAATGACA 
CCACTGGGCC 
GCCCTTGCCC 
CAAGCCTCTG 
CTGATTATGC 
AGTATCTGAT 
GGTGAAAAGA 
CTTCCCTGAT 
AATTATAAAT 
GGATGACCTG 
ACCTGCAGTG 
GGACCCAGAC 
GTGTTTCCAA 
GGTCAGGAGT 
AGATGTGCGC 
TTGACGAGAA 
CCTTAGCTTG 
GTGAGCCAGC 
AAAAAAA 



41 



CCGGGGCCCT 
CCTAACGGCG 
GAAAACGCAG 
GGCTGCCCCT 
CCCCTGCCCA 
CTTGCAAGTT 
TAGTGGCCAT 
GAAAAGAGAG 
CAACTCAGCC 
AAGTGACCCT 
CACCTGGAGC 
GCACTAT CAA 
TGGGCTCCCG 
GACAGGTTAA 
AGCGGCCACC 
AGCGCATGAC 
ACATTGCCAA 
TTGTCCGGGA 
ACCGCTACTT 
GCCGGAACAT 
TGCTACCACG 
TGTTGCAGCC 
TTGCCCGCCA 
TAGCTCCTCT 
TTTCTCCTTT 
TGCCACACTT 
CGGCCCCATC 
CCCCAAGACC 
TGCTTGTGAT 
TACTGCCTCC 
GCTGGGCCGC 
ACTCCCAGGA 
CCACCCCGAG 
CCAAAGTAGG 
TGCCTGACCC 
TTGAATCACC 
GCAACTCTTC 
CTGGCCTTGC 
GCCTCAGCAA 
CTGACAACAT 
CTGTGCTCAA 
AGTGAGGACA 
AAAAGTAGCA 
TCCTCTGCTG 
GATTAGGAAC 
CTTTGCAGGG 
GTAAGCTTAT 
GGGTTTCAAT 
CACGGTTTCT 
AAGTGGATCT 
GTCAGCTTTC 
TGAATTTGGG 
TATTAGATGT 
CTCAGGTGGA 
CCCCTCAGCT 
TTGAGAACAC 



51 
! 

GGCTCGGCCC 60 

GCGGCGACTG 120 

AT T C ATAATG 180 

TCCTGTTCAA 240 

ACAGGAGTCT 300 

TCCAGCTGGG 360 

CCCCAACAAT 42 0 

TGGCAGTAGT 480 

TCCAGGACTC 540 

GGAGACCTTG 600 

CCTTTGCGAG 660 

CAATAGCCTA 720 

CAGCAT CAAG 780 

GGTTGAGGAG 840 

CTACTCTTAC 900 

TTTGAAAGAC 960 

GCCAGGCTGG 1020 

GACGTCTGCC 1080 

GACATTGGAC 1140 

G AC CAT CAAA 1200 

GGTCAGCTCA 1260 

CTCGGTGAAG 1320 

TAGCAAGCGA 1380 

TTCTTCTGCA 1440 

GCTTCCAGTT 1500 

AG CGAGACCC 1560 

TTTCAAAGAG 1620 

CAAGAAGTCC 1680 

TCAACACAGG 1740 

CTGTGTGGAT 1800 

AGAGCTCCCG 1860 

AGTGGGAGGA 192 0 

CAAATCTGTC 1980 

GGGACTGGAT 2040 

CCTGGGGCTG 2100 

GCAAAGGCTC 2160 

TCCCTCAGAT 222 0 

AGCCAATCGT 22 80 

GATCCTGCTG 2340 

CAACTGGTCC 240 0 

GCTGTCCACC 2460 

GCAGGCAGGG 2520 

GTCACACCCT 2580 

TCCCTGCCAG 2640 

CCCCCAGCCT 2700 

TGGTCCGTGT 2760 

TTCCTTAGAT 2 820 

TGACTTCTGT 2880 

TCCAGGCTGA 2940 

GCTTGCCAGA 3000 

CTGCAAGAAG 30 60 

GTGGGAGGAT 3120 

TTCTCTGATA 3180 

GGCTTGAGAA 3240 

TTGCAAAGAG 3300 

TAACT ACT CA 3 3 60 



Seq ID NO: 71 Protein sequence: 
Protein Accession #: AAH06529.1 



215 



WO 02/086443 



PCT/US02/12476 



1 11 21 31 41 51 

I 1 I I I 1 

MKTSPRRPLI LKRRRLPLPV QNAPSETSEE EPKRSPAQQE SNQAEASKEV AESNSCKFPA 60 

5 GIKIINHPTM PNTQWAIPN NANIHSIITA LTAKGKESGS SGPNKFILIS CGGAPTQPPG 120 

LRPQTQTSYD AKRTEVTLET LGPKPAARDV NLPRPPGALC EQKRETCADG EAAGCTINNS 180 

LSNIQWLRKM SSDGLGSRSI KQEMEEKENC HLEQRQVKVE EPSRPSASWQ NSVSERPPYS 240 

YMAMIQFAIN STERKRMTLK DIYTWIEDHF PYFKHIAKPG WKNS I RHNL S LHDMFVRETS 3 00 

ANGKVS FWT I HPSANRYLTL DQVFKQQKRP NPELRRNMTI KTELPLGARR KMKPLLPRVS 360 

10 SYLVPIQFPV NQSLVLQPSV KVPLPLAASL MSSELARHSK RVRIAPKVLL AEEGIAPLSS 420 

AGPGKEEKLL FGEGFSPLLP VQTIKEEEIQ PGEEMPHLAR PIKVESPPLE EWPSPAPSFK 480 

EESSHSWEDS SQSPTPRPKK SYSGLRSPTR CVSEMLVIQH RERRERSRSR RKQHLLPPCV 540 

DEPELLFSEG PSTSRWAAEL PFPADSSDPA SQLSYSQEVG GPFKTPIKET LPISSTPSKS 600 

VLPRTPESWR LTPPAKVGGL DFSPVQTPQG ASDPLPDPLG LMDLSTTPLQ SAPPLESPQR 660 

15 LLSSEPLDLI SVPFGNSSPS DIDVPKPGSP EPQVSGLAAN RSLTEGLVLD TMNDSLSKIL 720 
LDISFPGLDE DPLGPDNINW SQFIPELQ 

Seq ID NO: 72 DNA sequence 
20 Nucleic Acid Accession #: U74612.1 
Coding sequence: 178-2583 

1 11 21 31 41 51 

I I I I I I 

25 GGCACGAGGG GGACCCGGCC GGTCCGGCGC GAGCCCCCGT CCGGGGCCCT GGCTCGGCCC 60 

CCAGGTTGGA GGAGCCCGGA GCCCGCCTTC GGAGCTACGG CCTAACGGCG GCGGCGACTG 120 

CAGTCTGGAG GGTCCACACT TGTGATTCTC AATGGAGAGT GAAAACGCAG ATTCATAATG 180 

AAAACTAGCC CCCGTCGGCC ACTGATTCTC AAAAGACGGA GGCTGCCCCT TCCTGTTCAA 240 

AATGCCCCAA GTGAAAC AT C AGAGGAGGAA CCTAAGAGAT CCCCTGCCCA ACAGGAGTCT 300 

30 AATCAAGCAG AGGCCTCCAA GGAAGTGGCA GAGTCCAACT CTTGCAAGTT TCCAGCTGGG 3 60 

ATCAAGATTA TTAACCACCC CACCATGCCC AACACGCAAG TAGTGGCCAT CCCCAACAAT 420 

GCTAAT ATT C ACAGCATCAT CACAGCACTG ACTGCCAAGG GAAAAGAGAG TGGCAGTAGT 480 

GGGCCCAACA AATTCATCCT CATCAGCTGT GGGGGAGCCC CAACTCAGCC TCCAGGACTC 540 

CGGCCTCAAA CCCAAACCAG CTATGATGCC AAAAGGACAG AAGTGACCCT GGAGACCTTG 600 

35 GGACCAAAAC CTGCAGCTAG GGATGTGAAT CTTCCTAGAC CACCTGGAGC CCTTTGCGAG 660 

CAGAAACGGG AG ACCTGTG C AGATGGTGAG GCAGCAGGCT GCACTATCAA CAATAGCCTA 720 

TCCAACATCC AGTGGCTTCG AAAGATGAGT TCTGATGGAC TGGGCTCCCG CAGCATCAAG 7 80 

CAAGAGATGG AGGAAAAGGA GAATTGT CAC CTGGAGCAGC GACAGGTTAA GGTTGAGGAG 840 

CCTTCGAGAC CATCAGCGTC CTGGCAGAAC TCTGTGTCTG AGCGGCCACC CTACTCTTAC 900 

40 ATGGCCATGA TACAATTCGC CATCAACAGC ACTGAGAGGA AGCGCATGAC TTTGAAAGAC 960 

ATCTATACGT GGATTGAGGA CCACTTTCCC TACTTTAAGC ACATTGCCAA GCCAGGCTGG 1020 

AAGAACTCCA TCCGCCACAA CCTTTCCCTG CACGACATGT TTGTCCGGGA GACGTCTGCC 1080 

AATGGCAAGG TCTCCTTCTG GACCATTCAC CCCAGTGCCA ACCGCTACTT GACATTGGAC 1140 

CAGGTGTTTA AGCCACTGGA CCCAGGGTCT CCACAATTGC CCGAGCACTT GGAATCACAG 120 0 

45 CAGAAACGAC CGAAT CCAGA GCTCCGCCGG AACATGACCA TCAAAACCGA ACTCCCCCTG 12 60 

GGCGCACGGC GGAAGATGAA GCCACTGCTA CCACGGGTCA GCTCATACCT GGTACCTATC 1320 

CAGTTCCCGG TGAACCAGTC ACTGGTGTTG CAGCCCTCGG TGAAGGTGCC ATTGCCCCTG 1380 

GCGGCTTCCC TCATGAGCTC AGAGCTTGCC CGCCATAGCA AGCGAGTCCG CATTGCCCCC 1440 

AAGGTTTTTG GGGAACAGGT GGTGTTTGGT TACATGAGTA AGTTCTTTAG TGGCG AT CTG 1500 

50 CGAGATTTTG GTACACCCAT CACCAGCTTG TTTAATTTTA TCTTTCTTTG TTTATCAGTG 1560 

CTGCTAGCTG AGGAGGGGAT AGCTCCTCTT TCTTCTGCAG GACCAGGGAA AGAGGAGAAA 1620 

CTCCTGTTTG GAGAAGGGTT TTCTCCTTTG CTTCCAGTTC AGACTATCAA GGAGGAAGAA 1680 

ATCCAGCCTG GGGAGGAAAT GCCACACTTA GCGAGACCCA TCAAAGTGGA GAGCCCTCCC 1740 

TTGGAAGAGT GGCCCTCCCC GGCCCCATCT TTCAAAGAGG AATCATCTCA CTCCTGGGAG 1800 

55 GATTCGTCCC AATCTCCCAC CCCAAGACCC AAGAAGTCCT ACAGTGGGCT TAGGTCCCCA 1860 

ACCCGGTGTG TCT CGGAAAT GCTTGTGATT CAACACAGGG AGAGGAGGGA GAGGAGCCGG 1920 

TCTCGGAGGA AACAGCATCT ACTGCCTCCC TGTGTGGATG AGCCGGAGCT GCTCTTCTCA 1980 

GAGGGGCCCA GTACTTCCCG CTGGGCCGCA GAGCTCCCGT TCCCAGCAGA CTCCTCTGAC 2040 

CCTGCCTCCC AGCTCAGCTA CTCCCAGGAA GTGGGAGGAC CTTTTAAGAC ACCCATTAAG 2100 

60 GAAACGCTGC CCATCTCCTC CACCCCGAGC AAATCTGTCC TCCCCAGAAC CCCTGAATCC 2160 

TGGAGGCT C A CGCCCCCAGC CAAAGTAGGG GGACTGGATT TCAGCCCAGT ACAAACCTCC 2220 

CAGGGTGCCT CTGACCCCTT GCCTGACCCC CTGGGGCTGA TGGATCTCAG CACCACTCCC 2280 

TTGCAAAGTG CTCCCCCCCT TGAATCACCG CAAAGGCTCC TCAGTTCAGA ACCCTTAGAC 2340 

CTCATCTCCG TCCCCTTTGG CAACTCTTCT CCCTCAGATA TAGACGTCCC CAAGCCAGGC 2400 

65 TCCCCGGAGC CACAGGTTTC TGGCCTTGCA GCCAATCGTT CTCTGACAGA AGGCCTGGTC 2460 

CTGGACACAA TGAATGACAG CCTCAGCAAG ATCCTGCTGG ACATCAGCTT TCCTGGCCTG 2520 

GACGAGGACC CACTGGGCCC TGACAACATC AACTGGTCCC AGTTTATTCC TGAGCTACAG 2580 

TAGAGCCCTG CCCTTGCCCC TGTGCTCAAG CTGTCCACCA TCCCGGGCAC TCCAAGGCTC 2640 

AGTGCACCCC AAGCCTCTGA GTGAGGACAG CAGGCAGGGA CTGTTCTGCT CCTCATAGCT 2700 

70 CCCTGCTGCC TGATTATGCA AAAGTAGCAG TCACACCCTA GCCACTGCTG GGACCTTGTG 2 760 

TTCCCCAAGA GTATCTGATT CCTCTGCTGT CCCTGCCAGG AGCTGAAGGG TGGGAACAAC 2 82 0 

AAAGGCAATG GTGAAAAGAG ATTAGGAACC CCCCAGCCTG TTTCCATTCT CTGCCCAGCA 2880 

GTCTCTTACC TTCCCTGATC TTTGCAGGGT GGTCCGTGTA AATAGTATAA ATTCTCCAAA 2940 

TTATCCTCTA ATTATAAATG TAAG CTTATT TCCTTAGATC ATTATCCAGA GACTGCCAGA 3000 

75 AGGTGGGTAG GATGACCTGG GGTTTCAATT GACTTCTGTT CCTTGCTTTT AGTTTTGATA 30 60 

GAAGGGAAGA CCTGCAGTGC ACGGTTTCTT CCAGGCTGAG GTACCTGGAT CTTGGGTTCT 3120 

TCACTGCAGG GACCCAGACA AGTGGATCTG CTTGCCAGAG TCCTTTTTGC CCCTCCCTGC 3180 

CACCTCCCCG TGTTTCCAAG TCAGCTTTCC TGCAAGAAGA AATCCTGGTT AAAAAAGTCT 3240 

TTTGTATTGG GTCAGGAGTT GAATTTGGGG TGGGAGGATG GATGCAACTG AAGCAGAGTG 3300 

80 TGGGTGCCCA GATGTGCGCT ATTAGATGTT TCTCTGATAA TGTCCCCAAT CATACCAGGG 3360 

AGACTGGCAT TGACGAGAAC TCAGGTGGAG GCTTGAGAAG GCCGAAAGGG CCCCTGACCT 3420 

GCCTGGCTTC CTTAGCTTGC CCCTCAGCTT TGCAAAGAGC CACCCTAGGC CCCAGCTGAC 3480 

CGCATGGGTG TGAGCCAGCT TGAGAACACT AACTACTCAA TAAAAGCGAA GGTGGACAAA 3540 
AAAAAAAAAA AAAAA 



85 



Seq ID NO: 73 Protein sequence: 
Protein Accession #: AAC51128.1 



216 



WO 02/086443 



1 
I 

MKTSPRRPLI 
GIKI INHPTM 
LRPQTQTSYD 
LSNIQWLRKM 
YMAMIQFAIN 
ANGKVSFWTI 
LGARRKMKPL 
PKVFGEQWF 
KLLFGEGFSP 
EDSSQSPTPR 
SEGPSTSRWA 
SWRLTPPAKV 
DLISVPFGNS 
LDEDPLGPDN 



11 

I 

LKRRRLPLPV 
PNTQWAIPN 
AKRTEVTLET 
SSDGLGSRSI 
STERKRMTLK 
HPSANRYLTL 
LPRVSSYIiVP 
GYMSKFFSGD 
LLPVQTIKEE 
PKKSYSGLRS 
AELPFPADSS 
GGLDFSPVQT 
SPSDIDVPKP 
INWSQFIPEL 



21 
I 

QNAPSETSEE 
NANIHSIITA 
LGPKPAARDV 
KQEMEEKENC 
DIYTWIEDHF 
DQVFKPLDPG 
IQFPVNQSLV 
LRDFGTPITS 
EIQPGEEMPH 
PTRCVSEMLV 
DPASQLSYSQ 
SQGASDPLPD 
GSPEPQVSGL 
Q 



31 

I 

EPKRSPAQQE 
LTAKGKESGS 
NLPRPPGALC 
HLEQRQVKVE 
PYFKHIAKPG 
SPQLPEHLES 
LQPSVKVPLP 
LFNFIFLCLS 
LARPIKVESP 
IQHRERRERS 
EVGGPFKTP I 
PLGLMDLSTT 
AANRSLTEGL 



41 
I 

SNQAEASKEV 
SGPNKFILIS 
EQKRETCADG 
EPSRPSASWQ 
WKNSIRHNLS 
QQKRPNPELR 
LAASLMSSEL 
VLLAEEGIAP 
PLEEWPSPAP 
RSRRKQHLLP 
KETLPISSTP 
PLQSAPPLES 
VLDTMND S Ii S 



51 
I 

AESNSCKFPA 
CGGAPTQPPG 
EAAGCT INNS 
NSVSERPPYS 
LHDMFVRETS 
RNMTIKTELP 
ARHSKRVRIA 
LSSAGPGKEE 
SFKEESSHSW 
PCVDEPELLF 
SKSVLPRTPE 
PQRLLSSEPL 
KILLDISFPG 



Seq ID NO: 74 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 111-416 



1 11 21 31 41 51 

I 1 I I I I 

GGGAAGAGCC AGGCTGAGCC TTATAAAGGA CTGCTCTTTG TCCAAACACA CACATCTCAC 

TCATCCTTCT ACTCGTGACG CTTCCCAGCT CTGGCTTTTT GAAAGCAAAG ATGAGCAACA 

CTCAAGCTGA GAGGTCCATA ATAGGCATGA TCGACATGTT TCACAAATAC ACCAGACGTG 

ATGACAAGAT TGAGAAGCCA AGCCTGCTGA CGATGATGAA GGAGAACTTG CCCAACTTCC 

TTAGTGCCTG TGACAAAAAG GGCACAAATT ACCTCGCCGA TGTCTTTGAG AAAAAGGACA 

AGAATGAGGA TAAGAAGATT GATTTTTCTG AGTTTCTGTC CTTGCTGGGA GACATAGCCA 

CAGACTACCA CAAGCAGAGC CATGGAGCAG CGCCCTGTTC CGGGGGCAGC CAGTGACCCA 

GCCCCACCAA TGGGCCTCCA GAGACCCCAG GAACAATAAA ATGTCTTCTC CCACCAGA 



Seq ID NO: 75 Protein sequence: 
Protein Accession #: Eos sequence 



1 11 21 31 41 51 

1 I I I I I 

MSNTQAERSI IGMIDMFHKY TRRDDKIEKP SLLTMMKENF PNFLSACDKK GTNYLADVFE 

KKDKNEDKKI DFSEFLSLLG DIATDYHKQS HGAAPCSGGS Q 



Seq ID NO: 76 DNA sequence 

Nucleic Acid Accession #: Eos sequence 

Coding sequence: 111-416 

1 11 21 31 41 51 

I l I I I l 

GGGAAGAGCC AGGCTGAGCC TTATAAAGGA CTGCTCTTTG TCCAAACACA CACATCTCAC 
TCATCCTTCT ACTCGTGACA CTTCCCAGTT CTGGCTTTTT GAAAGCAAAG ATGAGCAACA 
CTCAAGCTGA GAGGTCCATA ATAGGCATGA TCGACATGTT TCACAAATAC ACCGGACGTG 
ATGGCAAGAT TGAGAAGCCA AGCCTGCTGA CGATGATGAA GGAGAACTTC CCCAATTTCC 
TCAGTG CCTG TGACAAAAAG GGCATACATT ACCTCGCCAC TGTCTTTGAG AAAAAGGACA 
AGAATGAGGA TAAGAAGATT GATTTTTCTG AGTTTCTGTC CTTGCTGGGA GACATAGCCG 
CAGACTACCA CAAGCAGAGC CATGGAGCGG CGCCCTGTTC TGGGGGAAGC CAGTGATCCA 
GCCCCACCAA GGGGCCTCCA GAGACCCCAG GAACAATAAG TGTCTCCTCC CACCAGA 



Seq ID NO: 77 Protein sequence: 
Protein Accession #: XP_048124.1 



1 11 21 31 41 51 

I I I I I I 

MSNTQAERSI IGMIDMFHKY TGRDGKIEKP SLLTMMKENF PNFLSACDKK GIHYLATVFE 

KKDKNEDKKI DFSEFLSLLG DIAADYHKQS HGAAPCSGGS Q 



Seq ID NO: 78 DNA sequence 
Nucleic Acid Accession #: Z73678.1 
Coding sequence: 253-2433 



1 11 

I I 

GGGGTGGTGC AGGGCAGGGG 

CAGAGAGGGA CGAACCAGGG 
CCTCGCACTC TATGGCCGTA 
CGCTGCACCG CACCTCGCCT 
CCTCCCGCCA CCATGAACCA 
GACCAGGACA ACTCCACGTT 
GGCAGGCAGC GCGTGCAGGA 
TCCCAGTCGT CCACCCTGAG 
AATTACAACT ATGGGACCAC 
GGCTCATGGG GATATCCGAT 
TTCAGCTCCT ACAGCCAGAT 
ACCACCGGCG CAGGCAGCGA 
CCCGACCTCT ACTGTGACCC 
CAGAAGACCA CCCAGAACCG 
AAGAAGTGCC CTGTGCGCCC 



21 31 

I I 
TGGTATATCC TGTCTGACGG 

TGGAAGCGCC AGGAGCAGCT 

GGGAGCCGCT GAGAGCGAGA 

CGCCTCTCTG CTCTCCTAGG 

CTCGCCGCTC AAGACCGCCT 

GGCTTTGCCG TCGGACCAAA 

GCAGGTGATG ATGACCGTCA 

CCACTCCAAT CGAGGTTCCA 

CAGCAGGAGC AGCTACTACT 

CTACAATGGA ACCCTCAAGC 

GGAGAACTGG AGCCGGCACT 

CATCTGCTTC ATGCAGAAAA 

ACGGGGCACC CTGCGCAAGG 

CTACAGCTTT TACAGCACCT 

GCCCTCTTGT GCCTCCAAGC 



41 51 

I I 
AGGGCGGGCC TCGCCAGTGC 

GCAGGGAGCC CTCACGCGGA 

AGAGCACGCT CCTGCCCGCC 

CCCCGGCCGC GCGCCACCCG 

TGGCGTACGA ATGCTTCCAG 

AGATGAAAAC AGGCACGTCT 

AGCGGCAGAA GTCCAAGTCT 

TGTATGATGG CTTGGCTGAC 

CCAAGTTCCA GGCAGGGAAT 

GGGAGCCTGA CAACAGGCGC 

ACCCCCGGGG CAGCTGTAAC 

TCAAGGCGAG CCGCAGTGAG 

GCACGCTGGG CAGCAAGGGC 

GCAGTGGTCA GAAGGCCATA 

AGGACCCTGT GTATATCCCG 



217 
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15 
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60 
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70 



75 



WO 02/086443 

CCCATCTCCT GCAACAAGGA 
AGTGAGGACA TCGAGTGCAG 
CAGGATGAGA AGTACCAGGC 
GAAT CTGCCA AGCAACAGGT 
CGCAGCCCCA ACCAGAACGT 
AGGAGCACCA CCAACAAGCT 
CTCCTGAGGA GAACCGGGAA 
CTGTCTTCCA CTGACGAGCT 
GACCGCGTCA TCATTCCCTT 
GTGGTGGACC CTGAGGTCTT 
GATGCAGGCC GCCAGACCAT 
GTCCAGAACT GTGTAGCGGC 
GTTCTGCACA ACCTCTCCTA 
GAGTATAACG CCCGCAACGC 
AGCGACAAGA TGATGAACAA 
AAGGGCAGCG GCTGGTTGTA 
AAGAGCAAGA AAGATGCTAC 
AGCAAGGGGC TGATGTCCAG 
CCACAAATTG CCCGCCTCCT 
CTCCTGAGCA ACATGTCCCG 
CCGGAGGTGA CCAGGCTCCT 
TTGTCCTCGG CCTGCTACAC 
CAGTACTTCT CCAGCAGCAT 
CCCAAGGCCG CAGAAGCTGC 
CAGGGTGTCC TCAGACAGCA 
AACAGCCTCA GGAACTTCAC 
TG C AGGAAGA TATGACCCAG 
CATCCTGTGC AGTATTTGGG 
ATAGTGGAAA GATTTT T AGA 
AGGGAGGTTG GGGCGGGGGG 
TTTCTTCCTC TGAGAAATGG 
GCGTGCATGT GTGTGTGTGT 
TAAGCTATTT TGTTGCAGCT 
TAGGCAAGGA CAACATGTGC 
CAGGGCAAGG GGGCCATCAC 
AGTGGTCTCC AAGGGTGCAG 
GCTTTCCACG AAGGGAGGTC 
ACCCCTCCAG CAGCGCCACA 
AGGACACTCT CGCATACTTT 
GGTGCCTTCC ACCCTCTTGG 
TGCATTCAGA GGTCTTGTAA 
TTAAGAAAAG CTATTTTATT 
TCATATTCCC AGTGGAGAGG 
GTGGGATGGA GTTGGGGTAT 
AGT CAATTG A GGGAGTGTTT 
AGGAAAGGAA AGTGCCATAT 
CCATGCCCCA CTTCCCCTGA 
ATGTGATAAA CAGGGCTATT 
T GAG AC C AG C AGCAGCAGGA 
CCTTGGTGTA CACTAAGACA 
TCTACCTCCA TGCTAGCATT 
TCTCTAGAAG AATATAAGAT 
TCCTCTTCTG CACCACCCCC 
AACACTGATG TGGACT CAGT 
TGTCCTCCGA GAGGTGTCCC 
ATACCCTCCC TTGCTTCTGT 
AGGGACCCAC GTGGGAGCCT 
CTTTGTTGTC ATCAGAACCC 
TCTGTGCGGG GCAGTGTCCT 
CCCGTCCTCA TGCGGCTTAT 
GGGCTCCCCC GGCTGGGGGC 
CATGTGAACC TTACCAGCCC 
GCATCCCCTC GCCTCATGTT 
CCCTGCCCTG GGAACCAGGC 
AGGGCTGACT TTGGTGACAC 
CTGACCCAGG CCTGTCACTT 
AGAACAAGGA GCTTGCCAGG 
ATTGGCCTCA CACTAGCCTA 
TGAGGAAGGA CACAGACTCT 
GTCATTGGCC ACCAGCCACC 
CCTCCTGGGG ACCCAAGAGG 
ACTGGCTGGG AGGACCAAGA 
TGTGAGGGAT CTTGGAGCTT 
AACCTTGTGC CGGCCAGGCC 
GGAAATAGAG AAAATCAATA 



PCT/US02/12476 



CCTGTCCTTT 
TGGGCTGACC 
CATTGGGGCC 
CTATCAGCTG 
CCAGCAGGCC 
GGAGACCCGG 
CGCCGAGATC 
GAAGGAGGAA 
CTCTGGCTGG 
CTTCAATGCC 
GCGTAACTAC 
CAGCCGCTGT 
CCGCCTGGAC 
CTACACCGAG 
CAACTATGAC 
CCATT CAGAT 
CCTGGAGGCC 
TGGCATGAGC 
GCAATCTGGC 
CCACCCTCTG 
CACCAGCCAC 
TGTGAGGAAC 
GCTCAACAAC 
CCGGCTTCTC 
AGGTTTCGAT 
CTCCCGATTC 
CTGAGAAGCC 
AAAGTTCACA 

GGCTTTCTTG 
TATATATATG 
GAGTGTCTTA 
CATAAGGTGG 
TTTTTGGTGA 
TGCAGTCAGG 
GAGTAACTGG 
TGGTGTATCT 
AGGACTGAGG 
GCCAAATGAG 
GCTGTGTGCC 
TCTACTTGTT 
GCAGCTCTTT 
GGAACAAGTG 
AGAAATTAAC 
GGGTCCCAGG 
CAGGGTACCG 
CCCCAGCTGT 
AGGGGTATCA 
GGGCTCCCGA 
GAGCAGAGCC 
GCTGGTGTTA 
GCTCCTCCTC 
GAGTCCAAAC 
ATGACAACTG 
CGGCTGTTAG 
TCACACTGGG 
GGATCCCTGG 
AGAGGAATTC 
AAGCACTTAG 
GTTTTCTGGA 
TGTGCAGTCC 
AGGCGGATGC 
CCTCCCACCT 
AGCCTTCCAG 
TGCCCATTCC 
TGAGAGGGGC 
CTTCATGTAG 
GGCCAATGCC 
GCCCTGGGAT 
TCTGCAGTGG 
CAGTGTTGCT 
CTGCGGCTGG 
CCCTGTAGCC 
CAGTTTCCTT 
AATTGCTAGT 



GGCCACTCTA 

ATCCCCAAGG 

TATTACATCC 

GGAGGCATCT 

GCGGCAGGGG 

AGGCAGAATG 

CAGAAGCAGC 

CTCATTGCCG 

TGCGATGGCA 

ACAGGCTGCT 

TCAGGGCTCA 

GACGACAAGT 

GCCGAGGTGC 

AAGTCCTCCA 

TGCCCCCTGC 

GCCATCCGCA 

TGTGCTGGTG 

CAGTTGATTG 

AACTCTGATG 

CTGCACAGAG 

ACTGGCAATA 

CTGATGGCCT 

ATCATCAACC 

CTGTCTGACA 

AGGAACATGC 

TAAGAAGAGA 

CTCAGGCCTC 

AGAAACTGAG 

CCTTGGGGAA 

AGTTAAAGGG 

TGTCTAATGT 

AAGCATAACC 

TGAAAAGGAC 

GCTGCTCATA 

CCCTCAGAGG 

GGCTGGGCCA 

CATGGGAGAA 

TTGGGTAGGT 

GCCTGCTCAG 

CATCAGAGCA 

GCAGGAGAAA 

CCCAAGAGCT 

GGGCTGGGCA 

CAGGAAGATG 

AGACTTGGAC 

GTACCGGCAA 

CTTGTCTCCA 

GCCACGT CGA 

GGGCCTTATG 

CAGCGCTCCC 

GAGAGGAATT 

CTCACCCCTT 

CCACCTCTTG 

AGATGGGGGA 

CCAGCTGTGC 

AGGCCCACTC 

ACTGTCCTGG 

TTCTCCTAAA 

ACTA CAT CAG 

GGAAAGTGGA 

GGTCAGGGCG 

CCCTTCCCCT 

TCAAAGAATG 

ACCTCAGGGG 

CTCTCAGGCC 

AAAACTGAGA 

CCGACACACG 

CAAAATAAGG 

CTCCTGTGCT 

GGACCACACT 

GTCTGCGTGT 

GGTGGGCAGG 

CACCTTCCCC 

GTGTGATACA 

GTTTCTTTGA 



GGGCCAGCTC 

CTGTGCAGTA 

AGCATACCTG 

GCAAGCTGGT 

CCCTGCGCAA 

GGATCCGCGA 

TGACTGGGCT 

ACGCCCTGCC 

ATAGCAACAT 

TGAGGAACCT 

TTGATTCCCT 

CTGTGGAAAA 

CCACCCGCTA 

CTGGCTGCTT 

CTGAGGAAGA 

CCTACCTGAA 

CCCTGCAGAA 

GGCTGAAGGA 

TGGTGCGGTC 

TGATGGGGAA 

CCAGCAACTC 

CGCAGCCACA 

TGTGCCGAAG 

TGTGGTCCAG 

TGGGAACCTT 

CTGTCCAAGC 

GCTGGATGGG 

AAGAAACCTA 

ACTGGCAGGC 

GCTTATATGT 

AAGTGTGTGC 

ACAAACTGCA 

TCTCCTGTGT 

ATTCCTGAAA 

AGTCCTGCAG 

GCCTCCCCCC 

TCTGGGGTGT 

GTGAGGTTCC 

AGGAGTAGGA 

GGCTCAGCCT 

GAAGGTAAAA 

GTTCTGGGAA 

TATACCTATT 

TTTCCACCAA 

GGGGGGAGTT 

GCTCACATCT 

CTCTGTGAAA 

GCCCCCAGAC 

AGAAAACCTG 

AAGCCTTCCT 

AACTTCCTGG 

CTCAGCCTCC 

CCCCAGCATT 

AGCCAGACAT 

TGTGGTGCTG 

CTGGCTCACC 

GCATAGGTTT 

AAATACGTAT 

GGAAGAACAC 

GACACAAGTC 

GGAGGGGAAA 

TAGCACTACC 

AAGAGCCCCA 

CTGAGGCAGA 

AGCTCAGGTC 

GGGGCTTTTC 

TCTCAGGATT 

AGTTCCAATT 

AGCGGCCAAT 

AGCAGCCCTG 

CCACCTTGGA 

GAAGGGAAGC 

TTGCTTCATG 

CTAATGTATT 

AAAAAAAAA 



CAAGATCTGC 960 

CCTGAGCTCC 102 0 

CTTCCAGGAT 1080 

GGACCTCCTC 1140 

CCTGGTGTTC 12 00 

GGCAGTCAGC 1260 

GCTCTGGAAC 1320 

TGTTCTGGCC 1380 

GTCCCGGGAA 1440 

GAGCTCGGCC 1500 

CATGGCCTAT 1560 

CTGCATGTGT 162 0 

CCGCCAGCTG 1680 

CAGCAACAAG 1740 

GACCAACCCC 1800 

CCTCATGGGC 1860 

CCTGACAGCC 1920 

AAAGGGCCTG 1980 

CGGAGCCTCC 2040 

CCAGGTGTTC 2100 

CGAAGACATC 2160 

ACTGGCCAAG 222 0 

CAGTGCCTCA 22 80 

CAAGGAACTG 2 340 

AGCTGGGGCC 240 0 

AAGTTAGGCT 2460 

GTTTTCTGTC 2520 

AAAACTGTGG 2580 

AATGGGGGTT 2640 

GATGTCAATA 2700 

ATGCATGTGC 2760 

AAAAGCTAGG 2 820 

TTCTTACTCA 2 880 

TGTGTGGTGC 2 940 

GCTTCCTACC 3 000 

TTACAAGGCT 3 0 60 

CTGTAGTGTC 312 0 

AGAGGACAGC 3180 

GCTGAAAGAT 3240 

GCAAAGGCCC 3 3 00 

AATGATTTTT 33 60 

TGGCTGGTCT 342 0 

CCGGCTTCTA 3480 

GCCTGCTGTG 3540 

TGGGTAGACT 3 60 0 

CAGCCAGGGG 3 660 

CCCACAGGGG 3720 

TCTGTGCACT 3 780 

TGTGGACATC 3 840 

CCTTCCAGCT 3 90 0 

TCTGTGCCCT 3 960 

TCCCAAGTCT 4020 

CAGGCTGGAA 40 80 

GTGAGGACGC 4140 

TGGGTCTGTC 42 00 

TCTCCCTCTC 42 60 

CAGGGGCCTC 432 0 

GGCATACCAA 43 80 

AGACCACATC 4440 

CTTGGCTTTA 450 0 

TGCACCGCTG 4560 

CTGGCCTCCT 4620 

TGGGCCCAGC 4680 

CTATTAGGGC 4740 

ACCCGGGCCT 4800 

CTAGAGAAAG 4860 

TTAAGT CCAC 4 92 0 

TGGGG C C AAA 4980 

GACAAATCCA 5040 

ACTCCACACT 5100 

ATCTGGCTGA 5160 

CGGGGGCTGC 5220 

TTTGTAGAGG 5280 

TGCTTTTTTT 5340 



80 



85 



Seq ID NO: 79 Protein sequence: 
Protein Accession #: CAA98022.1 



1 11 

1 1 
MNHSPLKTAL AYECFQDQDN 

TLSHSNRGSM YDGLADNYNY 

SQMENWSRHY PRGSCNTTGA 

QNRYSFYSTC SGQKAIKKCP 

ECSGLTIPKA VQYLSSQDEK 

QNVQQAAAGA LRNLVFRSTT 



21 



STIALPSDQK 
GTTSRSSYYS 
GSDICFMQKI 
VRPPSCASKQ 
YQAIGAYYIQ 
NKLETRRQNG 



31 
I 

MKTGTSGRQR 
KFQAGNGSWG 
KASRSEPDLY 
DPVYIPPISC 
HTCFQDESAK 
IREAVSLLRR 



41 
I 

VQEQVMMTVK 
YPIYNGTLKR 
CDPRGTLRKG 
NKDLSFGHSR 
QQVYQLGGIC 
TGNAEIQKQL 



51 
I 

RQKSKSSQSS 60 

EPDNRRFSSY 12 0 

TLGSKGQKTT 180 

ASSKICSEDI 240 

KLVDLLRSPN 300 

TGLLWNLSST 3 60 



218 



WO 02/086443 

DELKEELIAD ALPVLADRVI 
QTMRNYSGLI DSLMAYVQNC 
RNAYTEKS ST GCFSNKSDKM 
DATLEACAGA LQNLTASKGL 
MSRHPLLHRV MGNQVFPEVT 
SSMLNNIINL CRSSASPKAA 
NFTSRF 



PCT/US02/12476 



IPFSGWCDGN 
VAASRCDDKS 
MNNNYDCPLP 
MSSGMSQLIG 
RLLTSHTGNT 
EAARLLLSDM 



SNMSREWDP 
VENCMCVLHN 
EEETNPKGSG 
LKEKGLPQIA 
SNSEDILSSA 
WSSKELQGVL 



EVFFNATGCL 
LSYRLDAEVP 
WIi YHSDA I RT 
RLLQSGNSDV 
CYTVRNLMAS 
RQQGFDRNML 



RNLSSADAGR 420 

TRYRQLEYNA 480 

YLNLMGKSKK 540 

VRSGASLLSN 600 

QPQLAKQYFS 660 

GTLAGANSLR 720 



10 



Seq ID NO: 80 DNA sequence 

Nucleic Acid Accession #: NM_006516.1 

Coding sequence : 180-1658 



15 



20 



25 



30 



35 



40 



45 



50 



55 



60 



TAGTCGCGGG 
GTCAGAGTCG 
CGCACGCCCG 
TGGAGCCCAG 
TTGGCTCCCT 
AGGAGTT CTA 
TCACCACGCT 
TCTCTGTGGG 
TGCTGGCCTT 
TGCTGATCCT 
CCATGTATGT 
AGCTGGGCAT 
GCAACAAGGA 
GCATCGTGCT 
AGAACCGGGC 
TGCAGGAGAT 
AGCTGTTCCG 
CCCAGCAGCT 
CGGGGGTGCA 
CTGTCGTGTC 
TCGCTGGCAT 
TACCCTGGAT 
TGGGTCCTGG 
CAGCTGCCAT 
GCTTCCAGTA 
TGGTTCTGTT 
ATGAGATCGC 
AGCTGTTCCA 
GCCTGCTCCC 
AACCTGACAG 
CCAGAAGAAT 
AAATCTATTC 
ATATCAGCCT 
GAGGGTGGAG 
CTGGACCTAT 
GAGGTGGCTA 
CATTAGGATT 
CCTGAGACCA 
GCCGGGTTCT 
GGGAGCCTGC 
TGCAAGATAT 
ATATCTGGAC 
TATAAATGGC 
TTTGGATGGG 
GACT CAGGAT 
TTTGATCCCT 
ATCACATATT 
AGGCTTGAAA 



11 
I 

TCCCCGAGTG 
CAGTGGGAGT 
TCGCCACCCG 
CAGCAAGAAG 
GCAGTTTGGC 
CAACCAGACA 
CTGGTCCCTC 
CCTTTTCGTT 
CGTGTCCGCC 
GGGCCGCTTC 
GGGTGAAGTG 
CGTCGTCGGC 
CCTGTGGCCC 
GCCCTTCTGC 
CAAGAGTGTG 
GAAGGAAGAG 
CTCCCCCGCC 
GTCTGGCATC 
GCAGCCTGTG 
GCTGTTTGTG 
GGCGGGTTGT 
GTCCTATCTG 
CCCCATCCCA 
TGCCGTTGCA 
TGTGGAGCAA 
CTTCATCTTC 
TTCCGGCTTC 
TCCCCTGGGG 
AGCAGCCCTA 
ATGTCAGCCG 
ATTCAGGACT 
AGACAAGCAA 
GAGTCTCCTG 
ACTAAGCCCT 
GTCCTAAGGA 
TGGCCACCCG 
TGCCCCTTCC 
GTTGGGAGCA 
AGTCTCCTTT 
AAACTCACTG 
TTATATATAT 
AAGCCAACTT 
TGGTTTTTAG 
AGTGAGACAG 
CCAGTCCCTT 
GTTACCCAGA 
TGATAGTTGG 
TCGCATTATT 



21 
I 

AGCACGCCAG 
CCCCGGACCG 
CGTACCCGGC 
CTGACGGGTC 
TACAACACTG 
TGGGTCCACC 
TCAGTGGCCA 
AACCGCTTTG 
GTGCTCATGG 
ATCATCGGTG 
TCACCCACAG 
ATCCTCATCG 
CTGCTGCTGA 
CCCGAGAGTC 
CTAAAGAAGC 
AGTCGGCAGA 
TACCGCCAGC 
AACGCTGTCT 
TATGCCACCA 
GTGGAGCGAG 
GCCATACTCA 
AGCATCGTGG 
TGGTTCATCG 
GGCTTCTCCA 
CTGTGTGGTC 
ACCTACTTCA 
CGGCAGGGGG 
GCTGATTCCC 
AGGATCTCTC 
AGCCGGGCCT 
TAACGGCTCC 
CAGGTTTTAT 
TGCCCACATC 
GTCGAGACAC 
CACACTAATC 
TTCTGCTGGC 
CATCTCTTCC 
CTGGAGTGCA 
GCACTGAGGG 
CTCAAGAAGA 
TTTTGGTTGT 
GTAAATACAC 
AAACATGGTT 
AAGTAAGTGG 
ACACGTACCT 
GAATATATAC 
TGTTCAAAAA 
TTGAATGTGA 



31 
I 

GGAGCAGGAG 
GAGCACGAGC 
GCAGCCAGAG 
GCCTCATGCT 
G AGT CAT CAA 
GCTATGGGGA 
TCTTTTCTGT 
GCCGGCGGAA 
GCTTCTCGAA 
TGTACTGCGG 
CCTTTCGTGG 
CCCAGGTGTT 
GCATCATCTT 
CCCGCTTCCT 
TGCGCGGGAC 
TGATGCGGGA 
CCATCCTCAT 
TCTATTACTC 
TTGGCTCCGG 
CAGGCCGGCG 
TGACCATCGC 
CCATCTTTGG 
TGGCTGAACT 
ACTGGACCTC 
CCTACGTCTT 
AAGTTCCTGA 
GAGCCAGCCA 
AAGTGTGAGT 
AGGAG CACAG 
GGGGCTCCTT 
AGGATTTTAA 
AATTTTTTTA 
CCAGGCTTCA 
TTGCCTTCTT 
GAACTATGAA 
CTGGATCTCC 
TACCCAACCA 
GGGAGGAGAG 
CCACACTATT 
CATGGAGACT 
CAATATTAAA 
CACCTCACTC 
TTGAAATGCT 
GGT TGCAACC 
CTCATCAGTG 
ATTCTTTATC 
AACACTAGTT 
AGGGAA 



41 

1 

ACCAAACGAC 
CTGAGCGGGA 
CCACCAGCGC 
GGCTGTGGGA 
TGCCCCCCAG 
GAGCATCCTG 
TGGGGGCATG 
TTCAATGCTG 
ACTGGGCAAG 
CCTGACCACA 
GGCCCTGGGC 
CGGCCTGGAC 
CATCCCGGCC 
GCTCATCAAC 
AGCTGACGTG 
GAAGAAGGTC 
CGCTGTGGTG 
CACGAGCATC 
TATCGTCAAC 
GACCCTGCAC 
GCTAGCACTG 
CTTTGTGGCC 
CTTCAGCCAG 
AAATTTCATT 
CATCATCTTC 
GACTAAAGGC 
AAGTGATAAG 
CGCCCCAGAT 
GCAGCTGGAT 
TCTCCAGCCA 
CAAAAGCAAG 
TTACTGATTT 
CCCTGAATGG 
CACCCAGCTA 
CTACAAAGCT 
CCACTCTAGG 
CTCAAATTAA 
GGGAAGGGCC 
ACCATGAGAA 
CCTGCCCTGT 
TACAGACACT 
CTGTTACTTA 
TGTGGATTGA 
ACTGCAACGG 
TCCTCTTGCT 
TTGACATTCA 
TTGTGCCAGC 



51 

I 

GGGGGTCGGA 60 

GAGCGCCGCT 120 

AGCGCTGCCA 180 

GGAGCAGTGC 240 

AAGGTGATCG 300 

CCCACCACGC 360 

ATTGGCTCCT 420 

ATGATGAACC 480 

TCCTTTGAGA 540 

GGCTTCGTGC 600 

ACCCTGCACC 660 

TCCATCATGG 72 0 

CTGCTGCAGT 780 

CGCAACGAGG 840 

ACCCATGACC 900 

ACCATCCTGG 960 

CTGCAGCTGT 1020 

TTCGAGAAGG 1080 

ACGGCCTTCA 1140 

CTCATAGGCC 1200 

CTGGAGCAGC 12 60 

TTCTTTGAAG 13 2 0 

GGTCCACGTC 1380 

GTGGGCATGT 1440 

ACTGTGCTCC 1500 

CGGACCTTCG 1560 

ACACCCGAGG 1620 

CACCAGCCCG 1680 

GAGACTTCCA 1740 

GCAATGATGT 1800 

ACTGTTGCTC 1860 

TGTTATTTTT 1920 

TTCCATGCCT 1980 

AT CTGTAGGG 2 040 

TCTATCCCAG 2100 

GGTCAGGCTC 2160 

TCTTTCTTTA 2220 

AGTCTGGGCT 2280 

GAGGGCCTGT 2340 

TGTGTATAGA 2400 

AAGTTATAGT 2460 

CCTAAACAGA 2520 

GGGTAGGAGG 2580 

CTTAGACTTC 2640 

CAAAAATCTG 2700 

AGGCATTTCT 2760 

CGTGATGCTC 2 82 0 



65 



Seq ID NO: 81 Protein sequence: 
Protein Accession #: NP 006507.1 



70 



75 



80 



85 



MEPSSKKLTG 
LTTLWSLSVA 
MLILGRFIIG 
GNKDLWPLLL 
LQEMKEESRQ 
AGVQQPVYAT 
LPWMSYLSIV 
CFQYVEQLCG 
ELFHPLGADS 



11 
I 

RLMIiAVGGAV 
IFSVGGMIGS 
VYCGLTTGFV 
SIIFIPALLQ 
MMREKKVTIL 
IGSGIVNTAF 
AIFGFVAFFE 
PYVFIIFTVL 
QV 



21 

I 

LGSLQFGYNT 
FSVGLFVNRF 
PMYVGEVSPT 
CIVLPFCPES 
ELFRSPAYRQ 
TWSLFWER 
VGPGPIPWFI 
LVLFFIFTYF 



31 

I 

GVINAPQKVI 
GRRNSMLMMN 
AFRGALGTLH 
PRFLLINRNE 
PILIAWLQL 
AGRRTLHLIG 
VAELFSQGPR 
KVPETKGRTF 



41 

I 

EEFYNQTWVH 
LLAFVSAVLM 
QLGIWGILI 
ENRAKSVLKK 
SQQLSGINAV 
LAGMAGCAIL 
PAAIAVAGFS 
DEIASGFRQG 



51 

I 

RYGESILPTT 
GFSKLGKSFE 
AQVFGLDSIM 
LRGTADVTHD 
FYYSTSIFEK 
MTIALALLEQ 
NWTSNFIVGM 
GASQSDKTPE 



Seq ID NO: 82 DNA sequence 
Nucleic Acid Accession #: BC001291 
Coding sequence: 44-541 

1 11 21 31 41 51 

l l l I l I 

GGGGGCGCCG CGCGCTGACC CTCCCTGGGC ACCGCTGGGG ACGATGGCGC TGCTCGCCTT 
GCTGCTGGTC GTGGCCCTAC CGCGGGTGTG GACAGACGCC AACCTGACTG CGAGACAACG 



60 
120 
180 
240 
300 
360 
420 
480 



60 
12 0 



219 



10 



15 



20 



WO 02/086443 

AGATCCAGAG GACTCCCAGC 
TGAGAGAGAA AACACTTTCG 
CTGCGTTATA GCGGCCGTGA 
CGCTGGTTGT GCAGCGATGG 
GCCCATGCCC TTCTTTTACC 
ACCTATCAAC TCATCAGTGT 
GCTGTGGCTG GCCATCCTCC 
AGCCACGGGA CTGCCACAGA 
ACCTGTTGCA TTAAACTTGT 
GGGATGGGAG AGTGGGGATC 
ACATTCAGAG GAAGTCCAGA 
AAATCAAACC TTGTAACTCA 
CCTCTGAGGG CTTCAGTATT 
TGCTGAGATG CTTCCGACCT 
GGGTGAAGAC ATCCCTGGAG 
AGGGCTGCCC CCATTCCAGT 
CTACCAGATT CCAGGAGGCA 
ACCAGCTGGC ACAGGTGCAC 
ACTTAGGCCA AGTAGAGAGC 
CATCCATGGG GAGCTGAGAA 
TTCAAAAGTT CACGAAAAAA 



PCT/US02/12476 



GAACGGACGA 
AGTGCCAGAA 
AAATATTTCC 
AGAGACCCAA 
TCAAGTGTTG 
TCAAAGAATA 
TGCTGCTGGC 
CTGAGCCTTC 
TTTCTGTTGA 
AGGTGCAGTT 
TCTCCTGAGT 
TTTATTGCTG 
GATGGGGAGG 
TTCAGGTGAC 
TGAAGGACTC 
GGTGGAGGCG 
GAAGATAACT 
AGATTCATAA 
ATCAGGGTAA 
ATCAGACTCA 
AAAAAAAAAA 



GGGTGACAAT 
CCCAAGGAGG 
ACGTTTTTTC 
GCCAGAGGAG 
TAAAATTCGC 
TGCTGGGAGC 
CTCCATTGCA 
CGGAGCATGG 
TTACCTCTTG 
GGCTCTTAAC 
AGTGATTTTG 
ATGGCCACTC 
GAGGCCTAAG 
GCAGGAACAC 
CTCAGCATGG 
CTGTGGATGG 
AATTGTGTTG 
ATTCCCACAC 
ATGGCGTTCA 
AAGTTCCACC 
AAAAAAAAAA 



AGAGTGTGGT 
TGCAAATGGA 
ATGGTTGCGA 
AAGCGGTTTC 
TACTGCAATT 
ATGGGTGAGA 
GCCGGCCTCA 
ACTCGCTCCA 
GTTTGACTTC 
CCTCAAGGGT 
GTGACAAGTT 
TTTTCCTTGA 
TACCACTCAT 
TGGGGGAGTC 
GGGGCAGTGG 
CTGCTTTTCC 
AAGAAACTTA 
GTGTGTGTTC 
TTTCTCTGTT 
AAAAACAAAT 
AAAAAAAAAA 



GTCATGTTTG 180 

CAGAGCCATA 240 

AGCAGTGCTC 300 

TCCTGGAAGA 360 

TAGAGGGGCC 420 

GCTGTGGTGG 480 

GCCTGTCTTG 540 

GACCGTTGTC 600 

CCAGGGTCTT 660 

TCTTTAACTC 720 

TTTCTCTTTG 780 

CTCCCCTCTG 840 

GGAGAGTATG 900 

TGAATGATTG 960 

GGCACACGTT 102 0 

TCAACCTTTC 1080 

GACTTCACCC 1140 

AACAT CTGAA 1200 

AAGATGCAGC 1260 

ACAAGGGGAC 1320 
AAA 



25 



30 



Seq ID NO: 83 Protein sequence: 
Protein Accession #: AAH01291 



11 



21 



31 



51 



41 

.1 1 I I 

MALLALLLW ALPRVWTDAN LTARQRDPED SQRTDEGDNR VWCHVCEREN TFECQNPRRC 
KWTEPYCVIA AVKIFPRFFM VAKQCSAGCA AMERPKPEEK RFLLEEPMPF FYLKCCKIRY 
CNLEGPPINS SVFKEYAGSM GESCGGLWLA ILLLLASIAA GLSLS 



60 
120 



35 



Seq ID NO: 84 DNA sequence 

Nucleic Acid Accession #: NM_022 893 . 1 

Coding sequence: 229-2726 



11 



40 



45 



50 



55 



60 
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70 



75 



80 



85 



*r^r ^ni^ 

TGCGCCATCT 
TTTTCTCTGG 
CGCCCGCCGC 
AAGCAAGGCA 
ATTCTTACAG 
CTCCTCACCT 
GAGCACAAAC 
CCTTCCCCTT 
GTCACG CCAG 
GAACACATAG 
GGAGCTCTAA 
GATGAGCCCA 
CTCTTGCAAC 
AGTCCCCTGA 
CCACCTCTCC 
GGATCAGTAT 
CTGTTTAGTC 
GAAGAAATGG 
CCAATGGCTA 
AACACGTCTA 
CCATTCCAGC 
TCCGGCCCTC 
ACGTTCAAAT 
TACAAGTGCA 
AAGACGCACA 
GCCAGCTCCC 
TCCGTGGTGG 
GAGGAGGAAG 
CTGACGGAGA 
CACGAGAACA 
GACGTCATGC 
GTCCTGGGCG 
TGCGACGAAG 
CGCGGCTGCT 
AGCCCCAGCT 
CCCCCGGCCA 
GCCTCCAGGC 
GCCTCCTCGT 
GAGCTGGACG 
ATTAGTGGTC 
GAGTACTGTG 
ACGGGCGAAA 
CTCACCAGGC 
TGTAAGATGC 
GATCGAGTGT 
CTCCCACCTG 
CCTGTAGGAT 
ACGAAGCTAA 
TTCTTTTTTC 



TTTTTTGCTT 
TTGTATTATT 
AGTCTCCTTC 
CGCCGCCGCC 
AACCCCAGCA 
ATGATGAACC 
GTGGGCAGTG 
GGAAACAATG 
CACCAATCGA 
AAGATGACGA 
CAGATAAACT 
TCCCCACGCC 
GCAGCTACAC 
ACGCACAGAA 
CCCCGCGGGT 
ATGGGATTCA 
CGAGAGAGGC 
CACCACCGAG 
CCCTGGCCAC 
TGGAGCCTCC 
GCCCACCGCT 
CAGGTAGCAA 
CTCCCTCCCA 
TTCAGAGCAA 
ACCTGTGCGA 
TGCACAAATC 
CGGAACCCGG 
CCAAGTTCAA 
AGGAGGACGA 
GCGAGAGGGT 
GCT CGCGGGG 
AGGGCATGGT 
AGAAGCATAA 
ACTCGGTGGC 
CCCCGGGCGA 
CGCTGAGCCC 
CGATGCCCAA 
AGCTCAAAGA 
CGGAGCACTC 
GAGGGATCTC 
CGGGCACGGG 
GGAAAGTCTT 
GGCCTTATAA 
ACATGAAAAC 
CTTTTAGCGT 
TGAATAATGA 
ACACCCCCTT 
TTTTTTCTAG 
GAATATGAGA 
TTTTTCCTTT 



21 
I 

AAAAAAAAGC 
TCTAATTTAT 
TTTCTAACCC 
GCCGCCGCCG 
CTTAAGCAAA 
AGACCACGGC 
CCAGATGAAC 
CAATGGCAGC 
GATGAAAAAA 
TTGTTTATCA 
TCTGCACTGG 
TGGGATGAGT 
ATGTACAACT 
CACTCATGGA 
TGGTATCCCT 
TATTGCAGAC 
TTCCGGCCTG 
ACATCACTTG 
CCATCACCCG 
CGCCATGGAT 
GTCCCCAGGG 
GCCGCCCTTC 
GCCCCCGGTC 
CCTGGTGGTG 
CCACGCGTGC 
GTCCCCCATG 
CACCAGCGAC 
GAGCGAGAAC 
CGAGGAAGAG 
GGACTACGGC 
CGCGGTCGTG 
GCTCAGCTCC 
GCGCGGCCAC 
CGGCGAGTCG 
GTCGGCCTCG 
CTTCTCTAAG 
CACGGAGAAC 
TCCCTTCCTT 
CTCGGAGAAC 
GGGGCGCAGC 
CAGGCCCAGC 
CAAGAACTGT 
ATGCGAGCTG 
GCATGGCCAG 
GTACAGTACC 
TATAAAAACT 
TTT CACCAGT 
TCCCATGTGA 
GTGCTTGTCA 
T T T T T 



31 

1 

CATGACGGCT 
TTTGGATGTC 
GGCTCTCCCG 
CCCGCCCCGC 
CGGGAATTCT 
CCGTTGGGAG 
TTCCCATTGG 
CTCTGCTTAG 
GCATCCAATC 
ACGTCAT CT A 
AGGGGCCTCT 
GCAGAATATG 
TGCAAACAGC 
TTAAGAATCT 
TCAGGACTAG 
AATAACCCCT 
GCAGAAGGGC 
GACCCCCACC 
AGTGCCTTTG 
TTCTCTAGGA 
CGGCCCAGCC 
CTGGCGACGC 
AAGTCCAAGT 
CACCGGCGCA 
ACCCAGGCCA 
ACGGTCAAGT 
TTGGTGGGCA 
GACCCCAACC 
GAAGAAGAGG 
TTCGGGCTGA 
GGCGTGGGCG 
ATGCAGCACT 
CTGGCCGAGG 
GACCGCATAG 
GGGGGCCTGT 
CGCATCAAGC 
GTGTACT CGC 
AGCTTCGGAG 
GGGAGCTTGC 
GGCACGGGAA 
TCAAAAGAGG 
AGCAATCTCA 
TGCAACTATG 
GTGGGGAAGG 
CTGGAGAAAC 
GAATAGAGGT 
CCCTTTCCCC 
TTTAAACAAA 
CCAGCACACC 
TCCTTTATGT 



41 
I 

CTCCCACAAT 
AAAAGGCACT 
ATGTGAACCG 
AGCCCACCAT 
CGCCCGAGGC 
CTCCAGAAGG 
GGGACATTCT 
AAAAAGCTGT 
CCGTGGAGGT 
GAAGAATTTG 
CCTCCCCTCG 
CCCCGCAGGG 
CATTCACCAG 
ACTTAGAAAG 
GTGCAGAATG 
TTAACCTGCT 
GCTTTCCACC 
GCATAGAGCG 
ACAGGGTGCT 
GACTTAGAGA 
CTATGCAAAG 
CCCCCCTCCC 
CATGCGAGTT 
GCCACACGGG 
GCAAGCTGAA 
CCGACGACGG 
GCGCCAGCAG 
TGATCCCGGA 
AGGAAGAGGA 
GCCTGGAGGC 
ACGAGAGCCG 
TCAGCGAGGC 
CCGAGGGCCA 
ACGATGGCAC 
CCAAAAAGCT 
TCGAGAAGGA 
AGTGGCTCGC 
ACTCCAGACA 
GCTTCTCCAC 
GTGGAGGGAG 
GCAGACGCAG 
CTGTCCACAG 
CCTGTGCCCA 
ACGTTTACAA 
ACATGAAAAA 
ATATTAATAC 
ATCGCCCTCC 
CAAACAAACA 
TGTTTTTTTT 
TCTCACCGTT 



51 
I 

TCATCTTCCC 60 

GATGAAGATA 120 

AGCCGTCGTC 180 

GTCTCGCCGC 240 

TCTTGAAGCC 300 

GGAT CATGAC 360 

TATTTTTATC 420 

GGATAAGCCA 480 

TGGCATCCAG 540 

CCCCAAACAG 600 

TTCTGCACAT 660 

TATTTGTAAA 720 

TGCATGGTTT 780 

CGAACACGGA 840 

TCCTTCCCAG 90 0 

AAGAATACCA 960 

CACTCCCCCC 1020 

CCTGGGGGCG 1080 

GCGGTTGAAT 1140 

GCTGGCAGGG 1200 

GTTACTGCAA 12 60 

TCCTCTGCAA 1320 

CTGCGGCAAG 1380 

CGAGAAGCCC 1440 

GCGCCACATG 1500 

TCTCTCCACC 1560 

CGCGCTCAAG 1620 

GAACGGGGAC 1680 

GGAGGAGGAG 1740 

GGCGCGCCAC 1800 

CGCCCTGCCC 1860 

CTTCCACCAG 1920 

CAGGGACACT 1980 

TGTTAATGGC 2040 

GCTGCTGGGC 2100 

GTTCGACCTG 2160 

CGGCTACGCG 2220 

ATCGCCTTTT 22 80 

ACCGCCCGGG 2340 

CACGCCCCAT 2400 

CGACACT TGT 2460 

GAGAAGCCAC 2520 

GAGTAGCAAG 2580 

ATGTGAAATT 2640 

ATGGCACAGT 2700 

CCCTCCCTCA 2760 

AGCCCCACTC 2 82 0 

AACAGAAGTA 2880 

CTTTTTCTTT 2 940 

TGAATGCATG 3000 
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ATCTGTATGG GGCAATACTA TTGCATTTTA CGCAAACTTT GAGCCTTTCT CTTGTG CAAT 3060 

AATTTACATG TTGTGTATGT TTTTTTTTAA ACTTAGACAG CATGTATGGT ATGTTATGGC 312 0 

TATTTTAAAT TGTCCCTAAT TCGTTGCTGA GCAAACATGT TGCTGTTTCC AGTTCCGTTC 3180 

TGAGAGAAAA AGAGAGAGAG AGAGAAAAAG ACCATGCTGC ATACATT CTG TAATACATAT 3240 

5 CATGTACAGT TTTATTTTAT AACGTGAGGA GGAAAAACAG TCTTTGGATT AACCCTCTAT 33 00 

AGACAGAATA GATAGCACTG AAAAAAAATC TCTATGAGCT AAATGTCTGT CTCTAAAGGG 33 60 

TTAAATGTAT CAATTGGAAA GGAAGAAAAA AGGCCTTGAA TTGACAAATT AACAGAAAAA 3420 

CAGAACAAGT TTATTCTATC ATTTGGTTTT AAAATATGAG TGCCTTGGAT CTATTAAAAC 3480 

CACAT CGATG GTTCTTTCTA CTTGTTATAA ACTTGTAGCT TAATTCAGCA TTGGGTGAGG 3540 

10 TAATAAACCT TAGGAACTAG CATATAATTC TATATTGTAT TTCTCACAAC AATGGCTACC 3600 

TAAAAAGATG ACCCATTATG TCCTAGTTAA TCATCATTTT TCCTTTAGTT TAATTTTATA 3660 

AACAAAACTG ATTATACCAG TATAAAAGCT ACTTTGCTCC TGGTGAGAGC TTAAAAGAAA 3720 

TGGGCTGTTT TGCCCAAAGT TTTATTTTTT TTAAACAATG ATTAAATTGA ATGTGTAATG 3780 

TGCAAAAGCC CTGGAACGCA ATTAAATACA CTAGTAAGGA GTTCATTTTA TGAAGATATT 3840 

15 TGCTTTAATA ATGTCTTTTT AAAAATACTG GCACCAAAAG AAATAGATCC AGATCTACTT 3900 

GGTTGTCAAG TGGACAATCA AATGATAAAC TTTAAGACCT TGTATACCAT ATTGAAAGGA 3 960 

AGAGGCTGAC AATAAGGTTT GACAGAGGGG AACAGAAGAA AATAATATGA TTTATTAGCA 4020 

CAACGTGGTA CTATTTGCCA TTTAAAACTA GAACAGGTAT ATAAGCTAAT ATTGATACAA 4080 

TGATGATTAA CTATGAATTC TTAAGACTTG CATTTAAATG TGACATTCTT AAAAAAAGAA 4140 

20 GAGAAAGAAT TTTAAGAGTA GCAGTATATA TGTCTGTGCT CCCTAAAAGT TGTACTTCAT 4200 

TTCTTTTCCA TACACTGTGT GCTATTTGTG TTAACATGGA AGAGGATTCA TTGTTTTTAT 4260 

TTTTATTTTT TTAATTTTTT CTTTTTTATT AAGCTAGCAT CTGCCCCAGT TGGTGTTCAA 4320 

ATAGCACTTG ACTCTGCCTG TGATATCTGT ATCTTTTCTC TAATCAGAGA TACAGAGGTT 4380 

GAGTATAAAA TAAACCTGCT CAGATAGGAC AATTAAGTGC ACTGTACAAT TTTCCCAGTT 4440 

25 TACAGGTCTA TACTTAAGGG AAAAGT TGCA AGAATGCTGA AAAAAAATTG AACACAATCT 4500 

CATTGAGGAG CATTTTTTAA AAACTAAAAA AAAAAAAACT TTGCCAGCCA TTTACTTGAC 4560 

TATTGAGCTT ACTTACTTGG ACGCAACATT GCAAGCGCTG TGAATGGAAA CAGAATACAC 4620 

TTAACATAGA AATGAATGAT TGCTTTCGCT TCTACAGTGC AAGGATTTTT TTGTACAAAA 4680 

CTTTTTTAAA TATAAATGTT AAGAAAAATT TTTTTTAAAA AACACTTCAT TATGTTTAGG 4740 

30 GGGGAACTGC ATTTTAGGGT TCCATTGTCT TGGTGGTGTT ACAAGACTTG TTATCCATTT 4800 

AAAAATGGTA GTGGAAATTC TATGCCTTGG ATACACACCG CTCTTCAGGT TGTAAAAAAA 4860 

AAAAACATAC ATTGGGGAAA GGTTTAAGAT TATATAGTAC TTAAATATAG GAAAATGCAC 4920 

ACTCATGTTG ATTCCTATGC TAAAATACAT TTATGGTCTT TTTTCTGTAT TTCTAGAATG 4980 

GTATTTGAAT TAAATGTTCA TCTAGTGTTA GGCACTATAG TATTTATATT GAAGCTTGTA 5040 

35 TTTTTAACTG TTGCTTGTTC TCTTAAAAGG TATCAATGTA CCTTTTTTGG TAGTGGAAAA 5100 

AAAAAAGACA GGCTGCCACA GTATATTTTT TTAATTTGGC AGGATAATAT AGTGCAAATT 5160 

ATTTGTATGC TTCAAAAAAA AAAAAAAGAG AGAAACAAAA AAGTGTGACA TTACAGATGA 5220 

GAAGCCATAT AATGGCGGTT TGGGGGAGCC TGCTAGAATG TCACATGGAT GGCTGTCATA 52 80 

GGGGTTGTAC ATATCCTTTT TTGTTCCTTT TTCCTGCTGC CATACTGTAT GCAGTACTGC 5340 

40 AAGCTAATAA CGTTGGTTTG TTATGTAGTG TGCTTTTTGT CCCTTTCCTT CTATCACCCT 54 0 0 

ACATTCCAGC ATCTTACCTT CATATGCAGT AAAAGAAAGA AAGAAAAAAA AAGGAAAAAA 5460 

AAAAAAAAAC CAATGTTTTG CAGTTTTTTT CATTGCCAAA AACTAAATGG TGCTTTATAT 5520 

TTAGATTGGA AAGAATTTCA TATGCAAAGC ATATTAAAGA GAAAGCCCGC T TTAGTCAAT 5580 

ACTTTTTTGT AAATGGCAAT GCAGAATATT TTGTTATTGG CCTTTTCTAT TCCTGTAATG 5640 

45 AAAGCTGTTT GTCGTAACTT GAAATTTTAT CTTTTACTAT GGGAGTCACT ATTTATTATT 5700 

GCTTATGTGC CCTGTTCAAA ACAGAGGCAC TTAATTTGAT CTTTTATTTT TCTTTGTTTT 5760 

TATTTTTTTT TTTATTTAGA TGACCAAAGG TCATTACAAC CTGGCTTTTT ATTGTATTTG 5820 

TTTCTGGTCT TTGTTAAGTT CTATTGGAAA AACCACTGTC TGTGTTTTTT TGGCAGTTGT 5880 

CTGCATTAAC CTGTTCATAC ACCCATTTTG TCCCT TTATT GAAAAAATAA AAAAAATTAA 5940 

50 a 

Seq ID NO: 85 Protein sequence: 
Protein Accession #•• NP_075044.1 

55 1 11 21 31 41 51 

I I I I i I 

MSRRKQGKPQ HLSKREFSPE PLEAILTDDE PDHGPLGAPE GDHDLLTCGQ CQMNFPLGDI 60 

LIFIEHKRKQ CNGSLCLEKA VDKPPSPSPI EMKKASNPVE VGIQVTPEDD DCLSTSSRRI 120 

CPKQEHIADK LLHWRGLSSP RSAHGALIPT PGMSAEYAPQ GICKDEPSSY TCTTCKQPFT 180 
60 SAWFLLQHAQ NTHGLRIYLE SEHGSPLTPR VGIPSGLGAE CPSQPPLHGI HIADNNPFNL 240 

LRIPGSVSRE ASGLAEGRFP PTPPLFSPPP RHHLDPHRIE RLGAEEMALA THHPSAFDRV 300 

LRLNPMAMEP PAMDFSRRLR ELAGNTSSPP LSPGRPSPMQ RLLQPFQPGS KPPFLATPPL 360 

PPLQSAPPPS QPPVKSKSCE FCGKTFKFQS NLWHRRSHT GEKPYKCNLC DHACTQASKL 42 0 

KRHMKTHMHK SSPMTVKSDD GLSTASSPEP GTSDLVGSAS SALKSWAKF KSENDPNLIP 4 80 
65 ENGDEEEEED DEEEEEEEEE EEEELTESER VDYGFGLSLE AARHHENSSR GAWGVGDES 540 

RALPDVMQGM VLSSMQHFSE AFHQVLGEKH KRGHLAEAEG HRDTCDEDSV AGESDRIDDG 60 0 

TVNGRGCSPG ESASGGLSKK LLLGSPSSLS PFSKRIKLEK EFDLPPATMP NTENVYSQWLt 660 

AGYAASRQLK DPFLSFGDSR QSPFASSSEH SSENGSLRFS TPPGELDGGI SGRSGTGSGG 720 

STPHISGPGT GRPSSKEGRR SDTCEYCGKV FKNCSNLTVH RRSHTGERPY KCELCNYACA 780 
70 QSSKLTRHMK THGQVGKDVY KCEICKMPFS VYSTLEKHMK KWHSDRVLNN DIKTE 



Seq ID NO: 86 DNA sequence 
Nucleic Acid Accession #: XM_035292.2 
/5 Coding sequence: 53-1576 

1 11 21 31 41 51 

III!)) 

GCTCGCTGGG CCGCGGCTCC CGGGTGTCCC AGGCCCGGCC GGTGCGCAGA GCATGGCGGG 60 

80 TGCGGGCCCG AAGCGGCGCG CGCTAGCGGC GCCGGCGGCC GAGGAGAAGG AAGAGGCGCG 120 

GGAGAAGATG CTGGCCGCCA AGAGCGCGGA CGGCTCGGCG CCGGCAGGCG AGGGCGAGGG 180 

CGTGACCCTG CAGCGGAACA TCACGCTGCT CAACGGCGTG GCCATCATCG TGGGGACCAT 240 

TATCGG CTCG GGCATCTTCG TGACGCCCAC GGGCGTGCTC AAGGAGGCAG GCTCGCCGGG 300 

GCTGGCGCTG GTGGTGTGGG CCGCGTGCGG CGTCTTCTCC ATCGTGGGCG CGCTCTGCTA 360 

85 CGCGGAGCTC GGCACCACCA TCTCCAAATC GGGCGGCGAC TACGCCTACA TGCTGGAGGT 420 

CTACGGCTCG CTGCCCGCCT TCCTCAAGCT CTGGATCGAG CTGCTCATCA TCCGGCCTTC 480 

ATCGCAGTAC AT CGTGGCCC TGGTCTTCGC CACCTACCTG CTCAAGCCGC TCTTCCCCAC 540 
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CTGCCCGGTG CCCGAGGAGG CAGCCAAGCT CGTGGCCTGC CTCTGCGTGC TGCTGCTCAC 
GGCCGTGAAC TGCTACAGCG TGAAGGCCGC CACCCGGGTC CAGGATGCCT TTGCCGCCGC 
CAAGCTCCTG GCCCTGGCCC TGAT CATCCT GCTGGGCTTC GTCCAGATCG GGAAGGGTGA 
TGTGTCCAAT CTAGATCCCA ACTTCTCATT TGAAGGCACC AAACTGGATG TGGGGAACAT 
TGTGCTGGCA TTATACAGCG GCCTCTTTGC CTATGGAGGA TGGAATTACT TGAATTTCGT 
CACAGAGGAA ATGATCAACC CCTACAGAAA CCTGCCCCTG GCCATCATCA TCTCCCTGCC 
CATCGTGACG CTGGTGTACG TGCTGACCAA CCTGGCCTAC TTCACCACCC TGTCCACCGA 
GCAGATGCTG TCGTCCGAGG CCGTGGCCGT GGACTT CGGG AACTATCACC TGGGCGT CAT 
GTCCTGGATC ATCCCCGTCT TCGTGGGCCT GTCCTGCTTC GGCTCCGTCA ATGGGTCCCT 
GTTCACATCC TCCAGGCTCT TCTTCGTGGG GTCCCGGGAA GGCCACCTGC CCTCCATCCT 
CTCCATGATC CACCCACAGC TCCTCACCCC CGTGCCGTCC CTCGTGTTCA CGTGTGTGAT 
GACGCTGCTC TACGCCTTCT CCAAGGACAT CTTCTCCGTC ATCAACTTCT TCAGCTTCTT 
CAACTGGCTC TGCGTGGCCC TGGCCATCAT CGGCATGATC TGGCTGCGCC ACAGAAAGCC 
TGAGCTTGAG CGGCCCATCA AGGTGAACCT GGCCCTGCCT GTGTTCTTCA TCCTGGCCTG 
CCTCTTCCTG ATCGCCGTCT CCTTCTGGAA GACACCCGTG GAGTGTGGCA TCGGCTTCAC 
CATCATCCTC AGCGGGCTGC CCGTCTACTT CTTCGGGGTC TGGTGGAAAA ACAAGCCCAA 
GTGGCTCCTC CAGGGCATCT TCTCCACGAC CGTCCTGTGT CAGAAGCTCA TGCAGGTGGT 
CCCCCAGGAG ACATAGCCAG GAGGCCGAGT GGCTGCCGGA GGAGCATGC 

Seq ID NO: 87 Protein sequence: 
Protein Accession #: XP_0352 92.2 

1 11 21 31 41 51 

I I I I I I 

MAGAGPKRRA LAAPAAEEKE EAREKMLAAK SADGSAPAGE GEGVTLQRNI TLLNGVAI IV 
GTIIGSGIFV TPTGVLKEAG SPGLAIiWWA ACGVFSIVGA LCYAELGTTI SKSGGDYAYM 
LEVYGSLPAF LKLWIELDII RPSSQYIVAL VFATYLLKPL FPTCPVPEEA AKLVACLCVL 
LLTAVNCYSV KAATRVQDAF AAAKLLALAL IILLGFVQIG KGDVSNLDPN FSFEGTKLDV 
GNIVLALYSG LFAYGGWNYL NFVTEEMINP YRNLPLAI I I SLPIVTLVYV LTNLAYFTTL 
STEQMLSSEA VAVDFGNYHL GVMSWIIPVF VGLSCFGSVN GSLFTSSRLF FVGSREGHLP 
SILSMIHPQL LTPVPSLVFT CVMTLLYAFS KDIFSVINFF SFFNWLCVAL AIIGMIWLRH 
RKPELERPIK VNLALPVFFI LACLFL I AVS FWKTPVECGI GFTIILSGLP VYFFGVWWKN 
KPKWLLQGIF STTVLCQKLM QWPQET 



Seq ID NO: 88 DNA sequence 

Nucleic Acid Accession #: NM_005268.1 

Coding sequence: 168-989 

1 11 21 31 41 51 

I I I I I 1 

TAAAAAGCAA AAGAATTCGC GGCCGCGTCG ACACGGGCTT CCCCGAAAAC CTTCCCCGCT 

TCTGGATATG AAATTCAAGC TGCTTGCTGA GTCCTATTGC CGGCTGCTGG GAGCCAGGAG 

AGCCCTGAGG AGTAGTCACT CAGTAGCAGC TGACGCGTGG GTCCACCATG AACTGGAGTA 

TCTTTGAGGG ACTCCTGAGT GGGGTCAACA AGTACTCCAC AGCCTTTGGG CGCATCTGGC 

TGTCTCTGGT CTTCATCTTC CGCGTGCTGG TGTACCTGGT GACGGCCGAG CGTGTGTGGA 

GTGATGACCA CAAGGACTTC GACTGCAATA CTCGCCAGCC CGGCTGCTCC AACGTCTGCT 

TTGATGAGTT CTTCCCTGTG TCCCATGTGC GCCTCTGGGC CCTGCAGCTT ATCCTGGTGA 

CATGCCCCTC ACTGCTCGTG GTCATGCACG TGGCCTACCG GGAGGTTCAG GAGAAGAGGC 

ACCGAGAAGC CCATGGGGAG AACAGTGGGC GCCTCTACCT GAACCCCGGC AAGAAGCGGG 

GTGGGCTCTG GTGGACATAT GTCTGCAGCC TAGTGTTCAA GGCGAGCGTG GACATCGCCT 

TTCTCTATGT GTTCCACTCA TTCTACCCCA AATATATCCT CCCTCCTGTG GTCAAGTGCC 

ACGCAGATCC ATGTCCCAAT ATAGTGGACT GCTTCATCTC CAAGCCCTCA GAGAAGAACA 

TTTTCACCCT CTTCATGGTG GCCACAGCTG CCATCTGCAT CCTGCTCAAC CTCGTGGAGC 

TCATCTACCT GGTGAGCAAG AGATGCCACG AGTGCCTGGC AG CAAGGAAA GCTCAAGCCA 

TGTGCACAGG TCATCACCCC CACGGTACCA CCTCTTCCTG CAAACAAGAC GACCTCCTTT 

CGGGTGACCT CATCTTTCTG GGCT CAGACA GTCATCCTCC TCTCTTACCA GACCGCCCCC 

GAGACCATGT GAAGAAAACC ATCTTGTGAG GGGCTGCCTG GACTGGTCTG GCAGGTTGGG 

CCTGGATGGG GAGGCTCTAG CATCTCTCAT AGGTGCAACC TGAGAGTGGG GGAGCTAAGC 

CATGAGGTAG GGGCAGG CAA GAGAGAGGAT TCAGACG CTC TGGGAGCCAG TTCCTAGTCC 

TCAACTCCAG CCACCTGCCC CAGCTCGACG GCACTGGGCC AGTTCCCCCT CTGCTCTGCA 

GCTCGGTTTC CTTTTCTAGA ATGGAAATAG TGAGGGCCAA TGC 

Seq ID NO: 89 Protein sequence: 
Protein Accession #: NP_005259.1 

1 11 21 31 41 51 

I I I I I I 

MNWSIFEGLL SGVNKYSTAF GRIWLSLVFI FRVLVYLVTA ERVWSDDHKD FDCNTRQPGC 
SNVCFDEFFP VSHVRLWALQ LILVTCPSLL WMHVAYREV QEKRHREAHG ENSGRLYLNP 
GKKRGGLWWT YVCSLVFKAS VD I AFLYVFH SFYPKYILPP WKCHADPCP NIVDCFISKP 
SEKNIFTLFM VATAAICILL NLVELIYLVS KRCHECLAAR KAQAMCTGHH PHGTTSSCKQ 
DDLLSGDLIF LGSDSHPPLL PDRPRDHVKK TIL 



Seq ID NO: 90 DNA sequence 

Nucleic Acid Accession #: NM_0023 91.1 

Coding sequence: 26-457 

1 11 21 31 41 51 

I I I I I I 

CGGGCGAAGC AGCGCGGGCA GCGAGATGCA GCACCGAGGC TTCCTCCTCC TCACCCTCCT 
CGCCCTGCTG GCGCTCACCT CCGCGGTCGC CAAAAAGAAA GATAAGGTGA AGAAGGGCGG 
CCCGGGGAGC GAGTGCGCTG AGTGGGCCTG GGGGCCCTGC ACCCCCAGCA GCAAGGATTG 
CGGCGTGGGT TTCCGCGAGG GCACCTGCGG GGCCCAGACC CAGCGCATCC GGTGCAGGGT 
GCCCTGCAAC TGGAAGAAGG AGTTTGGAGC CGACTGCAAG TACAAGTTTG AGAACTGGGG 
TGCGTGTGAT GGGGGCACAG GCACCAAAGT CCGCCAAGGC ACCCTGAAGA AGGCGCGCTA 
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CAATGCTCAG TGCCAGGAGA CCATCCGCGT CACCAAGCCC TGCACCCCCA AGACCAAAGC 
AAAGGCCAAA GCCAAGAAAG GGAAGGGAAA GGACTAGACG CCAAGCCTGG ATGCCAAGGA 
GCCCCTGGTG TCACATGGGG CCTGGCCACG CCCTCCCTCT CCCAGGCCCG AGATGTGACC 
CACCAGTGCC TTCTGTCTGC TCGTTAGCTT TAATCAATCA TGCCCTGCCT TGTCCCTCTC 
ACTCCCCAGC CCCACCCCTA AGTGCCCAAA GTGGGGAGGG ACAAGGGATT CTGGGAAGCT 
TGAGCCTCCC CCAAAGCAAT GTGAGTCCCA GAGCCCGCTT TTGTTCTTCC CCACAATTCC 
ATTACTAAGA AACACATCAA ATAAACTGAC TTTTTCCCCC CAATAAAAGC TCTTCTTTTT 
TAATAT 

Seq ID NO: 91 Protein sequence: 
Protein Accession #: NP_002382.1 

1 11 21 31 41 51 

11)111 
MQHRGFLLLT LL ALL ALTS A VAKKKDKVKK GGPGSECAEW AWGPCTPSSK DCGVGFREGT 

CGAQTQR IRC RVPCNWKKEF GADCKYKFEN WGACDGGTGT KVRQGThKKA RYNAQCQETI 

RVTKPCTPKT KAKAKAKKGK GKD 



Seq ID NO: 92 DNA sequence 

Nucleic Acid Accession #: NM_005130.1 

Coding sequence: 98-802 

1 11 21 31 41 51 

I 1 1 I 1 I 

CTCTACCTGA CACAGCTGCA GCCTGCAATT CACTCCCACT GCCTGGGATT GCACTGGATC 

CGTGTGCTCA GAACAAGGTG AACGCCCAGC TGCAGCCATG AAGATCTGTA GCCTCACCCT 

GCTCTCCTTC CTCCTACTGG CTGCTCAGGT GCTCCTGGTG GAGGGGAAAA AAAAAGTGAA 

GAATGGACTT CACAGCAAAG TGGT CTCAGA ACAAAAGGAC ACTCTGGGCA ACACCCAGAT 

TAAGCAGAAA AGCAGGCCCG G G AACAAAGG CAAGTTTGTC ACCAAAGACC AAGCCAACTG 

CAGATGGGCT GCTACTGAGC AGGAGGAGGG CATCTCTCTC AAGGTTGAGT GCACTCAATT 

GGACCATGAA TTTTCCTGTG TCTTTGCTGG CAATCCAACC TCATGCCTAA AGCTCAAGGA 

TGAGAGAGTC TATTGGAAAC AAGTTGCCCG GAATCTGCGC TCACAGAAAG ACAT CTGTAG 

ATATTCCAAG ACAGCTGTGA AAACCAGAGT GTGCAGAAAG GATTTTCCAG AATCCAGTCT 

TAAGCTAGTC AGCTCCACTC TATTTGGGAA CACAAAGCCC AGGAAGGAGA AAACAGAGAT 

GTCCCCCAGG GAGCACATCA AGGGCAAAGA GACCACCCCC TCTAGCCTAG CAGTGACCCA 

GACCATGGCC ACCAAAGCTC CCGAGTGTGT GGAGGACCCA GATATGGCAA ACCAGAGGAA 

GACTGCCCTG GAGTTCTGTG GAGAGACTTG GAGCTCTCTC TGCACATTCT TCCTCAGCAT 

AGTGCAGGAC ACGTCATGCT AATGAGGTCA AAAGAGAACG GGTTCCTTTA AGAGATGTCA 

TGTCGTAAGT CCCTCTGTAT ACTTTAAAGC TCTCTACAGT CCCCCCAAAA TATGAACTTT 

TGTGCTTAGT GAGTGCAACG AAATATTTAA ACAAGTTTTG TATTTTTTGC TTTTGTGTTT 

TGGAATTTGC CTTATTTTTC TTGGATGCGA TGTT CAGAGG CTGTTTCCTG CAGCATGTAT 

TTCCATGGCC CACACAGCTA TGTGTTTGAG CAGCGAAGAG TCTTTGAGCT GAATGAGCCA 

GAGTGATAAT TTCAGTGCAA CGAACTTTCT GCTGAATTAA TGGTAATAAA ACTCTGGGTG 

TTTTTCAAAA AAAAAAAAAA AAA 

Seq ID NO: 93 Protein sequence: 
Protein Accession #: NP_005121.1 

1 11 21 31 41 51 

I 1 I I I 1 

MKICSLTLLS FLLLAAQVLL VEGKKKVKNG LHSKWSEQK DTLGNTQIKQ KSRPGNKGKF 

VTKDQANCRW AATEQEEGIS LKVECTQLDH EFSCVFAGNP TSCLKLKDER VYWKQVARNL 

RSQKDICRYS KTAVKTRVCR KDFPESSLKL VSSTLFGNTK PRKEKTEMSP REHIKGKETT 

PSSLAVTQTM ATKAPECVED PDMANQRKTA LEFCGETWSS LCTFFLSIVQ DTSC 

Seq ID NO: 94 DNA sequence 

Nucleic Acid Accession #: NM__012101 

Coding sequence: 125-18 91 

1 11 21 31 41 51 

I I I I I I 

CTCCTCACAG GTGTGTCTCT AGTCCTCGTG GTTGCCTGCC CCACTCCCTG CCGAGACGCC 
TGCCAGAAAG GTCACCTATC CTGAACCCCA GCAAGCCTGA AACAGCTCAG CCAAGCACCC 
TGCGATGGAA GCTG CAGATG CCTCCAGGAG CAACGGGTCG AGCCCAGAAG CCAGGGATGC 
CCGGAGCCCG TCGGGCCCCA GTGGCAGCCT GGAGAATGGC ACCAAGGCTG ACGGCAAGGA 
TGCCAAGACC ACCAACGGGC ACGGCGGGGA GGCAGCTGAG GGCAAGAGCC TGGG CAGCGC 
CCTGAAGCCA GGGGAAGGTA GGAGCGCCCT GTTCGCGGGC AATGAGTGGC GGCGACCCAT 
CATCCAGTTT GTCGAGTCCG GGGACGACAA GAACTCCAAC TACTTCAGCA TGGACTCTAT 
GGAAGGCAAG AGGTCGCCGT ACGCAGGGCT CCAGCTGGGG GCTGCCAAGA AGCCACCCGT 
TACCTTTGCC GAAAAGGGCG ACGTGCGCAA GTCCATTTTC TCGGAGTCCC GGAAGCCCAC 
GGTGTCCATC ATGGAGCCCG GGGAGACCCG GCGGAACAGC TACCCCCGGG CCGACACGGG 
CCTTTTTTCA CGGTCCAAGT CCGGCTCCGA GGAGGTGCTG TGCGACTCCT GCATCGGCAA 
CAAGCAGAAG GCGGTCAAGT CCTGCCTGGT GTGCCAGGCC TCCTTCTGCG AGCTGCATCT 
CAAGCCCCAC CTGGAGGGCG CCGCCTTCCG AGACCACCAG CTGCTCGAGC CCATCCGGGA 
CTTTGAGGCC CGCAAGTGTC CCGTGCATGG CAAGACGATG GAGCTCTTCT GCCAGACCGA 
CCAGACCTGC ATCTGCTACC TTTGCATGTT CCAGGAGCAC AAGAATCATA GCACCGTGAC 
AGTGGAGGAG GCCAAGGCCG AGAAGGAGAC GGAGCTGTCA CTGCAAAAGG AGCAGCTGCA 
GCTCAAGATC ATTGAGATTG AGGATGAAGC TGAGAAGTGG CAGAAGGAGA AGGACCGCAT 
CAAGAG CTTC ACCACCAATG AGAAGGCCAT CCTGGAGCAG AACTTCCGGG ACCTGGTGCG 
GGACCTGGAG AAGCAAAAGG AGGAAGTGAG GGCTGCGCTG GAGCAGCGGG AGCAGGATGC 
TGTGGACCAA GTGAAGGTGA TCATGGATGC TCTGGATGAG AGAGCCAAGG TGCTGCATGA 
GGACAAGCAG ACCCGGGAGC AGCTGCATAG CATCAGCGAC TCTGTGTTGT TTCTGCAGGA 
ATTTGGTGCA TTGATGAGCA ATTACTCTCT CCCCCCACCC CTGCCCACCT ATCATGTCCT 
GCTGGAGGGG GAGGGCCTGG GACAGTCACT AGGCAACTTC AAGGACGACC TGCTCAATGT 
ATGCATGCGC CACGTTGAGA AGATGTGCAA GGCGGACCTG AGCCGTAACT TCATTGAGAG 
GAACCACATG GAGAACGGTG GTGACCATCG CTATGTGAAC AACTACACGA ACAGCTTCGG 
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GGGTGAGTGG AGTGCACCGG 
TGGGGTCCGG ACATCATACC 
GAAGAATTTC AACAATCTCT 
CTCCTCCAGC ATTCAGAACT 
CTCCCTGAAA GGCTATCCCT 
TTGGAAATCT GGCAAGCAGA 
CAACGGGATT GGGTCCAACG 
CCCCTGCTCT TCCTCCTGAC 
TGGGAGGGAG CCTGGTCCTG 
GTTCCGGCCT CTCCGACTTC 
TGACCTCAGA TGGT CAC CAT 
TAGGTTGGGG CCTGCCCTAA 
CAGTGAGTAC CCGCATGGTA 
CT AT AG AC GT TTCTCTCCAA 
ACAGCCACCC ATCTCCCATT 
GTGCTCTCTC TCGTCCTACC 
CTGCAGATGG AAACCTCTCA 
ACAGCCACTT TGAGTCTGTG 
TAGCCAAGAT ATTCCTCTGT 
TCCACCCATG CAAATAGCTA 
TTCAGTCTAC ACTTTGGCAT 
GTGCCTTACA CACTGCCCCC 
TGATTACCCC CCATGTTGCA 
AGCAGCACAG TGGGGACATC 
GATGGGCCAG CTTGCAGGGG 
ATAAACCATT GGTCTGTC 
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ACACCATGAA 

AGCCCTCGTC 

ATGGCACCAA 

CTGACAATGA 

CCCTCATGCG 

CTATGCTGTC 

AAGCCCCATG 

CCTGCTGCTC 

CACCTGCCCT 

CCCACTGGCC 

CATTCCTGTG 

CCCGCCAGCC 

TCAGCCTGCC 

GGCCCTATCC 

CACATGGCCC 

TATCAATGCC 

GTGTCTTGAC 

GTCCCTGGAG 

TCCCTCTGCT 

CTGGCCCAGC 

TCTCTCTGGC 

ACCCTCAGCC 

TAT CAGGGTG 

TCCCGTCTCA 

TTGGGGAGGG 



GAGATACTCC 

TCCTGGCCGC 

AGGTAACTAC 

CCTGCCCGTC 

GAGCCAAAGC 

TCACTACCGG 

AGCTCCTGGC 

TTGCCTTCTA 

CTGCAGCCCT 

ACACTCCATT 

CTCAGAGGCC 

TCCTCCTCTC 

TCTCCCGCCC 

CCCAATGTTG 

ACCTCCTGCT 

CAGCATGGCA 

ATCACCCTAC 

GGTGGCTTCT 

GAGATAAAGA 

TACCATTTAC 

GATGGAGTGT 

GTTGCCCCAT 

CT CAAGGATT 

ACAGCCCCAG 

AGACATCCAG 



ATGTACCTGA 

TTCACCAAGG 

ACCTCCCGGG 

GTCCAAGGCA 

CCCAAGGCCC 

CCATTCTACG 

GGAAGGAACG 

AGCTACTGTG 

CTGCCAGCCT 

CAGACTCCTT 

AACCCATCAC 

GGGCTGGATC 

ACGCCCTGCT 

TCAGCAGATG 

TCCCAGAGGA 

GAACCTGCAG 

CCAGGCGGTG 

CCTGACTGGC 

ATTCCCTTAA 

CATTTGCCTA 

GGCTGGGCTG 

CAGAGGCTGC 

GGAGAGGAGA 

GCCTATGGGG 

CTTGGGCTTT 



CACCCAAAGG 

AGACCACCCA 

TCTGGGAGTA 

GCTCCTCCTT 

AGCCCCAGAC 

TCAACAAAGG 

AGGCGCCACA 

CTTGTCTGGG 

CT TGGGGGCA 

TCCTGCCTTG 

AGGGGTGAGA 

TGGGGGCTAG 

GTCTCCAGGC 

CCTGGACAGC 

CTGGCCCTAC 

TGGCCAAGGG 

GGTCTCCACC 

AGGATGACCT 

CATGATATAA 

CAGAATTTCA 

ACCGCAAAAG 

CTCCTCCTTC 

CAAAACCAGG 

GCTCTGGAAG 

CCCCTTTGGA 



Seq ID NO: 95 Protein sequence: 
Protein Accession #: NP_036233.1 



1 

MEAADASRSN 
KPGEGRSAIiF 
FAEKGDVRKS 
QKAVKSCLVC 
TCICYLCMFQ 
SFTTNEKAIL 
KQTREQLHSI 
MRHVEKMCKA 
VRTSYQPSSP 
LKGYPSLMRS 



11 
I 

GSSPEARDAR 

AGNEWRRP I I 

IFSESRKPTV 

QASFCELHLK 

EHKNHSTVTV 

EQNFRDLVRD 

SDSVLFLQEF 

DLSRNFIERN 

GRFTKETTQK 

QSPKAQPQTW 



21 
I 

SPSGPSGSLE 
QFVESGDDKN 
SIMEPGETRR 
PHLEGAAFRD 
EEAKAEKETE 
LEKQKEEVRA 
GALMSNYSLP 
HMENGGDHRY 
NFNNLYGTKG 
KSGKQTMLSH 



31 
I 

NGTKADGKDA 
SNYFSMDSME 
NSYPRADTGL 
HQLLEPIRDF 
LSLQKEQLQL 
ALEQREQDAV 
PPLPTYHVLL 
VNNYTNSFGG 
NYTSRVWEY S 
YRPFYVNKGN 



41 

i 

KTTNGHGGEA 
GKRSPYAGLQ 
FSRSKSGSEE 
EARKCPVHGK 
KIIEIEDEAE 
DQVKVIMDAL 
EGEGLGQSLG 
EWSAPDTMKR 
SSIQNSDNDL 
GIGSNEAP 



51 



AEGKSLGSAL 
LGAAKKPPVT 
VLCDSCIGNK 
TMELFCQTDQ 
KWQKEKDRIK 
DERAKVLHED 
NFKDDLLNVC 
YSMYLTPKGG 
PWQGSSSFS 



Seq ID NO: 96 DNA sequence 

Nucleic Acid Accession # NM_080668.1 

Coding sequence: 83-841 



85 



GGCACGAGGG 

GAGCTCGAGA 

GCGCTCCGGG 

AGGCTCTGAA 

AGTCAGAAAG 

CCAATCACCT 

TGGCAGGGAG 

CAGCACTCCT 

CAGAG ACT TG 

CTCTGCCTCT 

GGCAGAAGAC 

GGTTTGTGCA 

GAAACAGAAA 

GGCTGCGGCC 

AGATGCAGTG 

CCTGTGGAGA 

GCTGCGCATG 

TTAGGAAATG 

CCTTCCTATC 

GAATCAGTGG 

CTTGTTGGGA 

CCCTCCTGAG 

TTCAGTTCCG 

GAGGGCAATT 

AAGGATGTAG 

GTTTTCTAGT 

GCTGCTTGGA 

GCTCATGGCC 

TGCAGGGGTG 

ACCGAGTCTA 

CAACTATGCT 

ATAGCAATTT 

CTCATGATCT 

TTTGGATTTG 

TTTGATGTTT 

CAGAGAATGC 

AGGCGGGCCC 



11 

i 

CAGCGAGTGG 

CGGAG CCTAG 

CCAAGGGCCC 

CTCCCGAGCA 

CCCATCGTCT 

CGCAGGAGCC 

CTTACTAAGG 

GTGCCGAACC 

GAAATGTCTA 

ACCTCCACCC 

TTGTCCGGAG 

AAGCCCTGGG 

CGTAAGAAGA 

ATGAATGCCG 

GGGGGTGCAC 

GGACACTTAG 

AGGACTGTCT 

GGGCCGCCTG 

TCCCCAAAGT 

CCCAGCCAGA 

GGGGTGGCTG 

TTGCCTTCTG 

TGGGTTTCCC 

CTGTCTTGGA 

GGAGCCTTAG 

TCTGGTCTGC 

GCAAAGGGTG 

TCTGGGCTGG 

GAAGGTGGCC 

CTTGGCCCTA 

TGTAAAGTCC 

TAGTTTTTGG 

CTGGAGAATT 

AAGGCTGCCC 

AGAAGTTCGT 

CAGGGAAGAT 

TAATAAAACC 



21 



CCTTCCCGGT 

TTATGTCTGG 

CATCTCCTAC 

TCCTCCCTGA 

TAAAGAGGAT 

CTAGGATTTC 

AGGACCTTTT 

CTGAGGCCGA 

AGAAAGTCAG 

CAGGCCGCCG 

TCTCGCCAGT 

CCCCAGACAT 

AGAAAATGCC 

AGTTTGAAGC 

CTGGCCAGAC 

GGTCCCCTCC 

GCCTTTGAGG 

GCCCAGCCAC 

ACCATAGCCA 

AGTTAAAGGG 

CTTGGAAATA 

TTGGTGGCTT 

CTTTGATTCT 

GGAAGAAGCT 

TTGGGTCTCA 

TGTTGAGATG 

CATTTCAGGG 

TCCCTTGCAC 

CCTCTTGTCA 

GAAGAGAAAG 

TCGGAAAGTT 

CCTCCCTATC 

TCCCCATCTT 

TGCCCCCGAC 

GGAAGTAGAC 

GAGTGCTGGG 

CTCTGCCAGG 



31 
I 

TGGCGCGCGC 
GAGGCGAACG 
TAAGCCTCTG 
AATCTGGCCG 
CGTGGCCCAT 
CTTTTTCTTG 
CAAGACACAC 
GTCCAGCTCC 
GCGTTCCTAC 
GTCCTGCTTT 
GGTGTGCTCC 
GACTCTCCCT 
AGAGATCTTG 
TGCTGAGCAG 
TCTCCCTCCT 
CCTGGTCTTG 
GCTTGGGCAG 
TCACTGGTGT 
GTTTCCAGAT 
CTGAGGGTTG 
GGCCCAGGGG 
TCTTCTTGAA 
GTAAATAGTC 
GGACATTCAG 
GACCATAAGT 
TTTGGTAAAT 
TGTGGCCACC 
AGGGCCCACG 
CCCATACCCA 
TTGAAGAGTC 
TCCTCGCGTA 
* CTCTCACATG 
TCTCTTCTTT 
TCTCCTGCCG 
GCTGAGGTGT 
TCAGGGTACT 
TCTGGGAGTC 



41 

1 

CCGGGGCGGC 

CGGT CCGGAG 

CGGAGGTCCC 

AAGACACCCA 

GCTGTAGAGG 

GAGAAAGAAA 

AGCGTCCCTG 

AAGGAAGGAG 

AGCCGGCTGG 

GGCTTCGAGG 

AAACT CACCG 

GGAATCTCCC 

AAAACGGAGC 

TTTGATCTCC 

GTCCTGTACA 

TTACCTGTGT 

CAGCGGCAGC 

CCTGTCTCTT 

GGGCCACAGA 

AGGTGAGAGG 

CTCTGCCAGC 

CCCACCTGTG 

CCAGAGAGAA 

CCTGTGGAGT 

GTGTACTACA 

GCCAGGTTGA 

AGGTGCTGTG 

CTGGAGTCTT 

TTTCTTACAA 

CCAGACCTAC 

CCAGACAGCG 

AGAACACTGC 

CCATCGTGTG 

CACCCCTGGC 

GCAGAGGAGC 

TGGATGAAAC 

CCAGGCCATC 



1560 

1620 

1680 

1740 

1800 

1860 

1920 

1980 

2040 

2100 

2160 

2220 

2280 

2340 

2400 

2460 

2520 

2580 

2640 

2700 

2760 

2820 

2880 

2940 

3000 



51 

1 

GGCGCTGGAG 

GAGCCGCTCA 

AGCGGAAATC 

GTGCGGCTGC 

TCCCAGCTGT 

ACGAGCCCCC 

CCACCCCCAC 

AGCTGGACGC 

AGACCCTGGG 

GGCTGCTGGG 

AGGTCCCCAG 

CACCACCCGA 

TGGATGAGTG 

TGGTTGAATG 

TAGCCACCTC 

GTGTGCTGGT 

CATCTTGGTT 

GTCGTCCTGT 

CTGGGGAGGA 

CACCTCTGCT 

CTCGGCCTCT 

TAAAGAGGTT 

TTCGTGGGCT 

CTGAGTTTTG 

CAGAAGCTGT 

TAGGGCGCTG 

AGTTTCTGTG 

ACCACTCTGC 

AATAAGTTAC 

TAGCATTTTG 

GCGGGGGCTG 

CTGGATGCAT 

GATTCAATAG 

CATTGTACCT 

TGGT GGATAA 

GGTGCAGGCC 

TGCTCAACGC 



60 
120 
180 
240 
300 
360 
420 
480 
540 



60 
120 
180 
240 
300 
360 
420 
480 
540 
600 
660 
72 0 
780 
840 
900 
960 
1020 
1080 
1140 
1200 
1260 
1320 
1380 
1440 
1500 
1560 
1620 
1680 
1740 
1800 
1860 
1920 
1980 
2040 
2100 
2160 
2220 



224 



